diff --git "a/results.json" "b/results.json" --- "a/results.json" +++ "b/results.json" @@ -1,386882 +1,15290 @@ [ { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.5592169701, - "sentence_nr":0 + "score":0.2144530934 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.7187320759, - "sentence_nr":0 + "score":0.499609058 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.4438455476, - "sentence_nr":0 + "score":0.3307884966 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.6320800719, - "sentence_nr":0 + "score":0.5479156427 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.5894973559, - "sentence_nr":0 + "score":0.193036151 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.7562097957, - "sentence_nr":0 + "score":0.4366975641 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.3846086977, - "sentence_nr":0 + "score":0.2512647986 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.5835344719, - "sentence_nr":0 + "score":0.4387026201 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.4440401202, - "sentence_nr":0 + "score":0.249655311 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"amazon\/nova-micro-v1", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.634367012, - "sentence_nr":0 + "score":0.4987192142 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.3742128962, - "sentence_nr":0 + "score":0.3783450256 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.5924994298, - "sentence_nr":0 + "score":0.5970718288 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"amazon\/nova-micro-v1", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3206397177, - "sentence_nr":0 + "score":0.4813757383 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"amazon\/nova-micro-v1", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5206258402, - "sentence_nr":0 + "score":0.6701342658 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.390861271, - "sentence_nr":0 + "score":0.5512931433 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.6239956806, - "sentence_nr":0 + "score":0.763108119 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"amazon\/nova-micro-v1", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3020679768, - "sentence_nr":0 + "score":0.2057312363 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"amazon\/nova-micro-v1", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5246291817, - "sentence_nr":0 + "score":0.4645708907 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.3629639414, - "sentence_nr":0 + "score":0.3335475603 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.5313865724, - "sentence_nr":0 + "score":0.5654042924 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.8780634321, - "sentence_nr":0 + "score":0.2522597451 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.9269467001, - "sentence_nr":0 + "score":0.5010466238 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.7964573358, - "sentence_nr":0 + "score":0.4197992651 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.8458636472, - "sentence_nr":0 + "score":0.608198896 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"amazon\/nova-micro-v1", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":0 + "score":0.3499000643 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"amazon\/nova-micro-v1", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":0 + "score":0.5900050545 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"amazon\/nova-micro-v1", "bcp_47":"hi", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.9452996323, - "sentence_nr":0 + "score":0.3771214193 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"amazon\/nova-micro-v1", "bcp_47":"hi", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.9463396364, - "sentence_nr":0 + "score":0.5828460278 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.8781548422, - "sentence_nr":0 + "score":0.1774899549 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"amazon\/nova-micro-v1", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.9156314785, - "sentence_nr":0 + "score":0.4606519655 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.3240643366, - "sentence_nr":0 + "score":0.1527125759 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.5243586267, - "sentence_nr":0 + "score":0.5471305127 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3463367232, - "sentence_nr":0 + "score":0.2535676165 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5378805625, - "sentence_nr":0 + "score":0.5161759227 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.3852076286, - "sentence_nr":0 + "score":0.3421090766 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.562982276, - "sentence_nr":0 + "score":0.4832285924 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2602101451, - "sentence_nr":0 + "score":0.2559752722 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"amazon\/nova-micro-v1", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4820043661, - "sentence_nr":0 + "score":0.4824824422 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.3207234978, - "sentence_nr":0 + "score":0.1620132742 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.4977201244, - "sentence_nr":0 + "score":0.4958991194 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.4318843329, - "sentence_nr":0 + "score":0.1417986092 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.6011096109, - "sentence_nr":0 + "score":0.4193263814 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.3582301851, - "sentence_nr":0 + "score":0.1222453955 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.5380305838, - "sentence_nr":0 + "score":0.3265542088 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.4417559394, - "sentence_nr":0 + "score":0.3643913289 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.6111096353, - "sentence_nr":0 + "score":0.5978521406 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.3905612193, - "sentence_nr":0 + "score":0.3487197391 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.5861956607, - "sentence_nr":0 + "score":0.4994988579 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.4354870568, - "sentence_nr":0 + "score":0.2674020405 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.6005516255, - "sentence_nr":0 + "score":0.4916276462 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.4641883722, - "sentence_nr":0 + "score":0.449593878 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.640326715, - "sentence_nr":0 + "score":0.6517684253 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.3007405773, - "sentence_nr":0 + "score":0.1691106182 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5272774705, - "sentence_nr":0 + "score":0.4371008423 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.40610665, - "sentence_nr":0 + "score":0.3132986377 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.6080346531, - "sentence_nr":0 + "score":0.559742916 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.3152039044, - "sentence_nr":0 + "score":0.1944514657 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.566675397, - "sentence_nr":0 + "score":0.4363680283 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.4045482503, - "sentence_nr":0 + "score":0.2507279258 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.5951482608, - "sentence_nr":0 + "score":0.5456882386 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.4422044706, - "sentence_nr":0 + "score":0.2351879022 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.6089032707, - "sentence_nr":0 + "score":0.5015135666 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.3099603853, - "sentence_nr":0 + "score":0.2443279394 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.5209233177, - "sentence_nr":0 + "score":0.4616934816 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.3093921662, - "sentence_nr":0 + "score":0.2239109073 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5208328629, - "sentence_nr":0 + "score":0.4664590257 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.2417404985, - "sentence_nr":0 + "score":0.1004419383 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.4540589962, - "sentence_nr":0 + "score":0.3466465332 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.3443388178, - "sentence_nr":0 + "score":0.1579119983 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.5341360898, - "sentence_nr":0 + "score":0.4176784236 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.4331131004, - "sentence_nr":0 + "score":0.2143148158 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.5898969623, - "sentence_nr":0 + "score":0.4814311669 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.3558039927, - "sentence_nr":0 + "score":0.1837575642 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5392592206, - "sentence_nr":0 + "score":0.4701178189 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.4072470239, - "sentence_nr":0 + "score":0.2769852176 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"amazon\/nova-micro-v1", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.5650294312, - "sentence_nr":0 + "score":0.3191136721 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.3741026208, - "sentence_nr":0 + "score":0.2700460204 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5834523244, - "sentence_nr":0 + "score":0.5538421491 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.3938763752, - "sentence_nr":0 + "score":0.3429486101 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.5909459754, - "sentence_nr":0 + "score":0.585338958 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.5274220384, - "sentence_nr":0 + "score":0.2518742297 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.676558814, - "sentence_nr":0 + "score":0.4808653185 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.3931738146, - "sentence_nr":0 + "score":0.3262591736 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.6026058741, - "sentence_nr":0 + "score":0.5167211951 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.3229030612, - "sentence_nr":0 + "score":0.296094691 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5136703373, - "sentence_nr":0 + "score":0.5405203037 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.3113772787, - "sentence_nr":0 + "score":0.4521703872 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.5344680037, - "sentence_nr":0 + "score":0.6510137978 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.4015176111, - "sentence_nr":0 + "score":0.5350598812 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5570033942, - "sentence_nr":0 + "score":0.6920702898 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.427346675, - "sentence_nr":0 + "score":0.6197100322 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.6397906518, - "sentence_nr":0 + "score":0.7935529886 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.4893093641, - "sentence_nr":0 + "score":0.3328054743 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.6990856292, - "sentence_nr":0 + "score":0.5621761866 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.4951704011, - "sentence_nr":0 + "score":0.3056069517 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.6726500193, - "sentence_nr":0 + "score":0.5864625476 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.474262745, - "sentence_nr":0 + "score":0.3183976094 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.6547171932, - "sentence_nr":0 + "score":0.5810941349 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.5534262126, - "sentence_nr":0 + "score":0.4748705901 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.7517262393, - "sentence_nr":0 + "score":0.6771774372 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3692194586, - "sentence_nr":0 + "score":0.3380504047 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5602656573, - "sentence_nr":0 + "score":0.5712827315 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.3963410286, - "sentence_nr":0 + "score":0.4099090208 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.6131661903, - "sentence_nr":0 + "score":0.6013300104 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3905898585, - "sentence_nr":0 + "score":0.2977952957 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5498108215, - "sentence_nr":0 + "score":0.5374664029 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.3343350399, - "sentence_nr":0 + "score":0.3176178107 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.5465517654, - "sentence_nr":0 + "score":0.6263788011 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.4509623706, - "sentence_nr":0 + "score":0.2817398654 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.6276175882, - "sentence_nr":0 + "score":0.5582480948 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.4404175157, - "sentence_nr":0 + "score":0.4310206038 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.649940095, - "sentence_nr":0 + "score":0.5648545023 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.4429424771, - "sentence_nr":0 + "score":0.3061246587 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5915660675, - "sentence_nr":0 + "score":0.523750141 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.418987297, - "sentence_nr":0 + "score":0.2727123426 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.5748791698, - "sentence_nr":0 + "score":0.5748905525 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.202098372, - "sentence_nr":0 + "score":0.2242946033 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.4110516731, - "sentence_nr":0 + "score":0.5097037063 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.2970536843, - "sentence_nr":0 + "score":0.2137264994 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.5186257966, - "sentence_nr":0 + "score":0.440475376 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0740715445, - "sentence_nr":1 + "score":0.43589074 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4314543453, - "sentence_nr":1 + "score":0.6610423251 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.1290369606, - "sentence_nr":1 + "score":0.3781104049 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.456225988, - "sentence_nr":1 + "score":0.5478926249 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.3335410498 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.0244593913, - "sentence_nr":1 + "score":0.5672032656 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.1235182482, - "sentence_nr":1 + "score":0.4580630889 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.4682275447, - "sentence_nr":1 + "score":0.6657392427 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.1622106093, - "sentence_nr":1 + "score":0.2587147192 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5093553102, - "sentence_nr":1 + "score":0.5313277465 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.066471681, - "sentence_nr":1 + "score":0.3724063678 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.3435083262, - "sentence_nr":1 + "score":0.5962061241 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.1256067288, - "sentence_nr":1 + "score":0.2269997511 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.496956026, - "sentence_nr":1 + "score":0.4842755902 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.1707705852, - "sentence_nr":1 + "score":0.3044437459 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.5022008375, - "sentence_nr":1 + "score":0.6117061265 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.1078475606, - "sentence_nr":1 + "score":0.290563665 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4427230465, - "sentence_nr":1 + "score":0.5273017096 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.0797339583, - "sentence_nr":1 + "score":0.2358621489 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.4418411387, - "sentence_nr":1 + "score":0.4806590073 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0973598172, - "sentence_nr":1 + "score":0.2429196873 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.3528893466, - "sentence_nr":1 + "score":0.5008155104 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.0827317824, - "sentence_nr":1 + "score":0.3049495338 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.3639966646, - "sentence_nr":1 + "score":0.4791605551 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.1301287033, - "sentence_nr":1 + "score":0.2408476334 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.385283552, - "sentence_nr":1 + "score":0.4988564858 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2703596899 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.3356633416, - "sentence_nr":1 + "score":0.5116028165 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.0965691457, - "sentence_nr":1 + "score":0.2376852279 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.3802997171, - "sentence_nr":1 + "score":0.5256489144 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.1156401289, - "sentence_nr":1 + "score":0.2792207353 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-chat", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.4459978368, - "sentence_nr":1 + "score":0.3511763987 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.1260148278, - "sentence_nr":1 + "score":0.201730622 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4359566525, - "sentence_nr":1 + "score":0.5230392495 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.120222864, - "sentence_nr":1 + "score":0.3852105985 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.4827998681, - "sentence_nr":1 + "score":0.605693575 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1535037749, - "sentence_nr":1 + "score":0.2515106137 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.4764514844, - "sentence_nr":1 + "score":0.5085911882 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2989934852 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.432913173, - "sentence_nr":1 + "score":0.4923392967 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2947779952 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.2521233582, - "sentence_nr":1 + "score":0.5363074175 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.4095908744, - "sentence_nr":1 + "score":0.3523906614 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.6348509381, - "sentence_nr":1 + "score":0.5431292252 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.4095908744, - "sentence_nr":1 + "score":0.3549731332 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.6348509381, - "sentence_nr":1 + "score":0.516110221 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.3182970444, - "sentence_nr":1 + "score":0.5306797494 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.595316257, - "sentence_nr":1 + "score":0.7137131706 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2154426819, - "sentence_nr":1 + "score":0.2686376487 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5620944561, - "sentence_nr":1 + "score":0.5150941143 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.0867932999, - "sentence_nr":1 + "score":0.2858074351 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.4201964133, - "sentence_nr":1 + "score":0.5391420281 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.0821410657, - "sentence_nr":1 + "score":0.2992701671 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.3969463878, - "sentence_nr":1 + "score":0.5475268989 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.1897299381, - "sentence_nr":1 + "score":0.3905037889 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.5086851538, - "sentence_nr":1 + "score":0.6068698391 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.3538422525 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.3833939462, - "sentence_nr":1 + "score":0.5862254357 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.0829682579, - "sentence_nr":1 + "score":0.41385038 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.384929236, - "sentence_nr":1 + "score":0.6049826714 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.3007180384 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.3630576976, - "sentence_nr":1 + "score":0.5023246329 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.0744904632, - "sentence_nr":1 + "score":0.334501536 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.4111163206, - "sentence_nr":1 + "score":0.6312038844 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2664302142 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.43631303, - "sentence_nr":1 + "score":0.5511307577 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.3695096312 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.4174727607, - "sentence_nr":1 + "score":0.5016072256 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2557256216 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4278386149, - "sentence_nr":1 + "score":0.4694930912 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.0861671109, - "sentence_nr":1 + "score":0.2301023035 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.3696512763, - "sentence_nr":1 + "score":0.5333883608 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.1289410403, - "sentence_nr":1 + "score":0.2389669394 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.4486368935, - "sentence_nr":1 + "score":0.4384602668 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.0882525219, - "sentence_nr":1 + "score":0.1906304694 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.4377853722, - "sentence_nr":1 + "score":0.43321511 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0534513757, - "sentence_nr":1 + "score":0.2890532438 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.3829169125, - "sentence_nr":1 + "score":0.5744900625 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2023348505 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.4024696873, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1538602933, - "sentence_nr":1 + "score":0.4209687673 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"deepseek\/deepseek-chat-v3-0324", "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4391148259, - "sentence_nr":1 + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"deepseek\/deepseek-chat-v3-0324", "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1007092756, - "sentence_nr":1 + "score":0.3077173175 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"deepseek\/deepseek-chat-v3-0324", "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4371822026, - "sentence_nr":1 + "score":0.5684889974 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"deepseek\/deepseek-chat-v3-0324", "bcp_47":"pt", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1147846313, - "sentence_nr":1 + "score":0.3988769765 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"deepseek\/deepseek-chat-v3-0324", "bcp_47":"pt", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.4651957502, - "sentence_nr":1 + "score":0.6526950425 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.0713710158, - "sentence_nr":1 + "score":0.1939421958 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.4075406301, - "sentence_nr":1 + "score":0.4613061334 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.0846581996, - "sentence_nr":1 + "score":0.2954667205 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.4509865769, - "sentence_nr":1 + "score":0.4928272924 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2244277924 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.1946966569, - "sentence_nr":1 + "score":0.4632403501 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.0772718393, - "sentence_nr":1 + "score":0.2475167578 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.4203683137, - "sentence_nr":1 + "score":0.5859145482 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0829135716, - "sentence_nr":1 + "score":0.2491270517 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4009694997, - "sentence_nr":1 + "score":0.4971850787 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.230423487 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.3714280467, - "sentence_nr":1 + "score":0.4572263206 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0889905327, - "sentence_nr":1 + "score":0.2528912211 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.4022940284, - "sentence_nr":1 + "score":0.5471673071 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.0612660422, - "sentence_nr":1 + "score":0.2890836127 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.3837677428, - "sentence_nr":1 + "score":0.4638645889 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.0756907194, - "sentence_nr":1 + "score":0.2182193511 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4138725094, - "sentence_nr":1 + "score":0.4918690502 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.0886663742, - "sentence_nr":1 + "score":0.3051142824 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.4487646223, - "sentence_nr":1 + "score":0.5736498723 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1057442843, - "sentence_nr":1 + "score":0.1267866191 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.453718146, - "sentence_nr":1 + "score":0.3661653956 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2217838799 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", + "model":"deepseek\/deepseek-chat-v3-0324", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.4393340573, - "sentence_nr":1 + "score":0.3212219671 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.1195053738, - "sentence_nr":1 + "score":0.1955321366 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.451213629, - "sentence_nr":1 + "score":0.4452496338 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.2174835365, - "sentence_nr":1 + "score":0.3157575918 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.4462746463, - "sentence_nr":1 + "score":0.5012233036 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2444399937, - "sentence_nr":1 + "score":0.1735477119 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.4991016393, - "sentence_nr":1 + "score":0.4036037512 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2603256448 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.3415556284, - "sentence_nr":1 + "score":0.4715465891 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.0889084344, - "sentence_nr":1 + "score":0.2350996731 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.3974812246, - "sentence_nr":1 + "score":0.4539868888 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.3961285597, - "sentence_nr":2 + "score":0.4694847332 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.6148751441, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.49237513, - "sentence_nr":2 + "score":0.6499890785 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"deepseek\/deepseek-r1", "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.685375649, - "sentence_nr":2 + "task":"mmlu", + "metric":"accuracy", + "score":0.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"deepseek\/deepseek-r1", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3996712648, - "sentence_nr":2 + "score":0.4790246882 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"deepseek\/deepseek-r1", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.6353525756, - "sentence_nr":2 + "score":0.6389223375 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"deepseek\/deepseek-r1", "bcp_47":"en", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.5115346945, - "sentence_nr":2 + "score":0.6184989115 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"deepseek\/deepseek-r1", "bcp_47":"en", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.7037574716, - "sentence_nr":2 + "score":0.8037117471 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.5396134765, - "sentence_nr":2 + "score":0.1802447888 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.7656669576, - "sentence_nr":2 + "score":0.352852694 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.1737495157, - "sentence_nr":2 + "score":0.32221956 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.4532559788, - "sentence_nr":2 + "score":0.5945828154 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.1774329946, - "sentence_nr":2 + "score":0.1396007132 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.430712719, - "sentence_nr":2 + "score":0.2948285656 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.1605265407, - "sentence_nr":2 + "score":0.4626443841 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.4158012087, - "sentence_nr":2 + "score":0.6453178011 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.0596357961, - "sentence_nr":2 + "score":0.3248801173 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.3113976238, - "sentence_nr":2 + "score":0.5368976197 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.1688287853, - "sentence_nr":2 + "score":0.3477596714 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.4916588179, - "sentence_nr":2 + "score":0.542033928 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2680102298, - "sentence_nr":2 + "score":0.2034777205 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5654883865, - "sentence_nr":2 + "score":0.4787094647 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.2166540719, - "sentence_nr":2 + "score":0.4161506758 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.4344921443, - "sentence_nr":2 + "score":0.675862263 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2735429727, - "sentence_nr":2 + "score":0.2148759695 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5644723204, - "sentence_nr":2 + "score":0.4372780553 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.2022332245, - "sentence_nr":2 + "score":0.1725311936 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.5084057058, - "sentence_nr":2 + "score":0.3103103139 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.278351925, - "sentence_nr":2 + "score":0.3165472295 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5348467461, - "sentence_nr":2 + "score":0.5345475991 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.3574583793, - "sentence_nr":2 + "score":0.2983221296 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.592411512, - "sentence_nr":2 + "score":0.5707529624 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3799465256, - "sentence_nr":2 + "score":0.1247777236 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.6464467277, - "sentence_nr":2 + "score":0.2923162337 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.420650773, - "sentence_nr":2 + "score":0.1050598836 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.6788513036, - "sentence_nr":2 + "score":0.2683360352 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.3536718074, - "sentence_nr":2 + "score":0.1844224826 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.6344846207, - "sentence_nr":2 + "score":0.3422693726 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.4583059141, - "sentence_nr":2 + "score":0.1807039126 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.6572591476, - "sentence_nr":2 + "score":0.2632902709 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2229272631, - "sentence_nr":2 + "score":0.2434841819 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5653789748, - "sentence_nr":2 + "score":0.4532930974 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.0936226112, - "sentence_nr":2 + "score":0.4043131386 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.3452056942, - "sentence_nr":2 + "score":0.5936961583 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2693093705, - "sentence_nr":2 + "score":0.1866121683 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5410704186, - "sentence_nr":2 + "score":0.3995426351 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.2463476586, - "sentence_nr":2 + "score":0.3589759487 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.5596851385, - "sentence_nr":2 + "score":0.5459455358 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.266398619, - "sentence_nr":2 + "score":0.2525543056 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5645550913, - "sentence_nr":2 + "score":0.4855834718 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.2140322213, - "sentence_nr":2 + "score":0.3353132654 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.5631214322, - "sentence_nr":2 + "score":0.5534047662 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.1891762066, - "sentence_nr":2 + "score":0.1505793252 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4346170233, - "sentence_nr":2 + "score":0.269111455 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.185053788, - "sentence_nr":2 + "score":0.1313190377 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.4705108742, - "sentence_nr":2 + "score":0.3349177081 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"deepseek\/deepseek-r1", "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0980716713, - "sentence_nr":2 + "score":0.1514267917 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"deepseek\/deepseek-r1", "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.4646043403, - "sentence_nr":2 + "score":0.3397549606 }, { - "model":"openai\/gpt-4.1-mini", + "model":"deepseek\/deepseek-r1", "bcp_47":"ur", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1724657814, - "sentence_nr":2 + "score":0.2593168504 }, { - "model":"openai\/gpt-4.1-mini", + "model":"deepseek\/deepseek-r1", "bcp_47":"ur", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.4978075401, - "sentence_nr":2 + "score":0.4181171937 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.4054983797, - "sentence_nr":2 + "score":0.1737123456 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.6264774231, - "sentence_nr":2 + "score":0.3975781626 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.4204505079, - "sentence_nr":2 + "score":0.320003713 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.6503146347, - "sentence_nr":2 + "score":0.5179634386 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.4387071211, - "sentence_nr":2 + "score":0.2147159409 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6525926696, - "sentence_nr":2 + "score":0.4884471405 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.420744549, - "sentence_nr":2 + "score":0.2856153111 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"deepseek\/deepseek-r1", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.6496192656, - "sentence_nr":2 + "score":0.3570853581 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.4877513773, - "sentence_nr":2 + "score":0.2957143991 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.7197897787, - "sentence_nr":2 + "score":0.5733819398 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.2005111976, - "sentence_nr":2 + "score":0.3975775226 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.5334791309, - "sentence_nr":2 + "score":0.6026539032 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2489407298, - "sentence_nr":2 + "score":0.2722037865 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-001", "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5212235893, - "sentence_nr":2 + "score":0.5441644725 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-001", "bcp_47":"bn", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.2372464203, - "sentence_nr":2 + "score":0.3756817753 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-001", "bcp_47":"bn", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.5175129869, - "sentence_nr":2 + "score":0.5431366991 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.184941941, - "sentence_nr":2 + "score":0.3669235156 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5067677917, - "sentence_nr":2 + "score":0.61602266 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.3189223091, - "sentence_nr":2 + "score":0.515407684 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.5875084576, - "sentence_nr":2 + "score":0.6945040285 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.353500237, - "sentence_nr":2 + "score":0.5394941139 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5959879218, - "sentence_nr":2 + "score":0.7176459206 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.3936136052, - "sentence_nr":2 + "score":0.6542806821 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.6492198448, - "sentence_nr":2 + "score":0.8016677558 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3936136052, - "sentence_nr":2 + "score":0.2647784787 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.6492198448, - "sentence_nr":2 + "score":0.534131581 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.3833310864, - "sentence_nr":2 + "score":0.3885319246 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.6252821653, - "sentence_nr":2 + "score":0.6122434715 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3938668169, - "sentence_nr":2 + "score":0.3106669108 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.6503960274, - "sentence_nr":2 + "score":0.5636006618 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.3598376609, - "sentence_nr":2 + "score":0.5258244924 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.5862251405, - "sentence_nr":2 + "score":0.7167464827 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.2114773474, - "sentence_nr":2 + "score":0.3579075772 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.4102017865, - "sentence_nr":2 + "score":0.6194831237 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.3563982586, - "sentence_nr":2 + "score":0.4158534882 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.5378970485, - "sentence_nr":2 + "score":0.6174987325 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1510722413, - "sentence_nr":2 + "score":0.3245383993 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4359232973, - "sentence_nr":2 + "score":0.5729744645 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.3276244253, - "sentence_nr":2 + "score":0.4448839139 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.5817308767, - "sentence_nr":2 + "score":0.6973440754 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2971752224, - "sentence_nr":2 + "score":0.3117179672 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.6051336645, - "sentence_nr":2 + "score":0.5777870563 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.2329856852, - "sentence_nr":2 + "score":0.3252873649 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.5405751251, - "sentence_nr":2 + "score":0.4988074019 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2563564295, - "sentence_nr":2 + "score":0.3569868465 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5499025329, - "sentence_nr":2 + "score":0.5843991239 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.2500653935, - "sentence_nr":2 + "score":0.3135334271 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.5098952452, - "sentence_nr":2 + "score":0.5896292046 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3410035629, - "sentence_nr":2 + "score":0.310376381 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.6673519559, - "sentence_nr":2 + "score":0.553246687 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.2786312784, - "sentence_nr":2 + "score":0.2835101619 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.4836796408, - "sentence_nr":2 + "score":0.4885179598 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.4175668624, - "sentence_nr":2 + "score":0.4330249307 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5616829346, - "sentence_nr":2 + "score":0.6595328005 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4205004826, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5674537639, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.4097432382, - "sentence_nr":2 + "score":0.4034194489 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.5368112087, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.380217695, - "sentence_nr":2 + "score":0.5814569981 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5452668935, - "sentence_nr":2 + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.7281051247, - "sentence_nr":3 + "score":0.3163929238 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.7882997401, - "sentence_nr":3 + "score":0.5723494086 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.5806197937, - "sentence_nr":3 + "score":0.5307526172 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.7346706701, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5793367581, - "sentence_nr":3 + "score":0.7110385531 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6502428442, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.4855332614, - "sentence_nr":3 + "score":0.2574428009 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5299556743, - "sentence_nr":3 + "score":0.5385430576 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.5411953361, - "sentence_nr":3 + "score":0.4379543642 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.6689891795, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2555219912, - "sentence_nr":3 + "score":0.6143170099 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3799133205, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.2338678621, - "sentence_nr":3 + "score":0.3703323281 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.3682311524, - "sentence_nr":3 + "score":0.5881678812 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.1173952179, - "sentence_nr":3 + "score":0.5012096467 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.2209049178, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1892240569, - "sentence_nr":3 + "score":0.7067312972 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2804131085, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0996020674, - "sentence_nr":3 + "score":0.3855742221 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.2144517459, - "sentence_nr":3 + "score":0.6089215443 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.4093301993, - "sentence_nr":3 + "score":0.3338485428 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.5127625182, - "sentence_nr":3 + "score":0.5599923303 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.6244631487, - "sentence_nr":3 + "score":0.256633436 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.6931369519, - "sentence_nr":3 + "score":0.5540218114 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.5819726385, - "sentence_nr":3 + "score":0.283656908 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.6970914529, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4412006373, - "sentence_nr":3 + "score":0.4700660306 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5296624609, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.5411953361, - "sentence_nr":3 + "score":0.2924845131 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.6689891795, - "sentence_nr":3 + "score":0.5532241595 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.4577275269, - "sentence_nr":3 + "score":0.3842345819 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.6747054474, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2538333923, - "sentence_nr":3 + "score":0.6178494251 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4589637948, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.3508739524, - "sentence_nr":3 + "score":0.2857271778 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5533976154, - "sentence_nr":3 + "score":0.5503996958 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.2370526644, - "sentence_nr":3 + "score":0.3778780802 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-001", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.4471600746, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3315041466, - "sentence_nr":3 + "score":0.397093475 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5307991157, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2766873691, - "sentence_nr":3 + "score":0.2261993605 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4414406761, - "sentence_nr":3 + "score":0.4713910334 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ar", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1720076757, - "sentence_nr":3 + "score":0.4047621232 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ar", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.3723150838, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2465659486, - "sentence_nr":3 + "score":0.6016984486 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.568906916, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":3 + "score":0.2193638362 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.3039115378, - "sentence_nr":3 + "score":0.4698224614 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.1548157555, - "sentence_nr":3 + "score":0.3331571997 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.3242496688, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4751132439, - "sentence_nr":3 + "score":0.5230347118 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6159319815, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1477219991, - "sentence_nr":3 + "score":0.2768085602 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.286852017, - "sentence_nr":3 + "score":0.4912101702 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.1477219991, - "sentence_nr":3 + "score":0.5341715111 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.2391308149, - "sentence_nr":3 + "score":0.7072193548 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.1818060822, - "sentence_nr":3 + "score":0.3830044788 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.2730775333, - "sentence_nr":3 + "score":0.5606920251 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.1496597508, - "sentence_nr":3 + "score":0.5668030405 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.2221350278, - "sentence_nr":3 + "score":0.7339158252 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.7281051247, - "sentence_nr":3 + "score":0.2943762224 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.7847983366, - "sentence_nr":3 + "score":0.5358537364 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.3254455687, - "sentence_nr":3 + "score":0.3601264217 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.4474512036, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 + "score":0.6055265571 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3267294026, - "sentence_nr":3 + "score":0.2647971272 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4510525483, - "sentence_nr":3 + "score":0.5503506292 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"fr", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.4855332614, - "sentence_nr":3 + "score":0.5019602858 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"fr", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.6448214025, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4815092082, - "sentence_nr":3 + "score":0.6907968386 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5820265218, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.2388752792, - "sentence_nr":3 + "score":0.3907958067 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.4120359949, - "sentence_nr":3 + "score":0.6168614685 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.36210097, - "sentence_nr":3 + "score":0.4116631597 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.4080981511, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.316501463, - "sentence_nr":3 + "score":0.6260711406 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4251617362, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3692377875, - "sentence_nr":3 + "score":0.2723472362 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5093945383, - "sentence_nr":3 + "score":0.5512694018 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 + "score":0.4033292298 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.7246473808, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 + "score":0.6688453679 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7282086346, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.5793367581, - "sentence_nr":3 + "score":0.2213115571 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.6502428442, - "sentence_nr":3 + "score":0.4716655163 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.1243018504, - "sentence_nr":3 + "score":0.2097990462 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.3295011624, - "sentence_nr":3 + "score":0.3915561417 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.5198707242, - "sentence_nr":3 + "score":0.3653472959 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.6498183531, - "sentence_nr":3 + "score":0.5797628494 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 + "score":0.3433849381 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 + "score":0.600500681 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":3 + "score":0.2443836816 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":3 + "score":0.4868851136 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":3 + "score":0.2414882248 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":3 + "score":0.4707414144 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":3 + "score":0.3529476629 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.0, - "sentence_nr":3 + "score":0.5689952282 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 + "score":0.4285508909 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 + "score":0.5918084941 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.4732072478, - "sentence_nr":3 + "score":0.311051651 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5833006007, - "sentence_nr":3 + "score":0.5763190766 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.3556521384, - "sentence_nr":3 + "score":0.5012048785 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.5948308114, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.5406964704, - "sentence_nr":3 + "score":0.6909453526 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.596459533, - "sentence_nr":3 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2575863752, - "sentence_nr":3 + "score":0.2525201789 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.3717184744, - "sentence_nr":3 + "score":0.4998034041 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1358581334, - "sentence_nr":3 + "score":0.3876399108 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.3021348975, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0893927012, - "sentence_nr":3 + "score":0.5526901501 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2952752522, - "sentence_nr":3 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.216291148, - "sentence_nr":3 + "score":0.2544576251 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.3542320138, - "sentence_nr":3 + "score":0.510033557 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.2199335663, - "sentence_nr":3 + "score":0.463366902 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.3822901361, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1221286555, - "sentence_nr":3 + "score":0.6862513407 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.276049295, - "sentence_nr":3 + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.1580460695, - "sentence_nr":3 + "score":0.2891932187 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.2486403592, - "sentence_nr":3 + "score":0.5401801911 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.2956394846 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":4 + "score":0.5301794135 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.2772013738 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":4 + "score":0.5352561426 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.3143344562 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":4 + "score":0.5013762031 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2023911962 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.2246029758, - "sentence_nr":4 + "score":0.4478296607 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.3591790299 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-2.0-flash-lite-001", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.5997773195 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2384160236 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 + "score":0.490052749 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"zh", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2454938644 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.0-flash-lite-001", "bcp_47":"zh", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 + "score":0.2975998115 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3372721649 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5581982021, - "sentence_nr":4 + "score":0.5838783957 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4321344547 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 + "score":0.6264247806 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2938960839 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.4379538199, - "sentence_nr":4 + "score":0.5517113066 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3782283657 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.5881561249, - "sentence_nr":4 + "score":0.5487977464 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3186073711 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.4667095722, - "sentence_nr":4 + "score":0.5411120296 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.5051785366 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.3754432474, - "sentence_nr":4 + "score":0.6920207566 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4956880203 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5293274846, - "sentence_nr":4 + "score":0.6377883658 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.6849600072 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.4121323135, - "sentence_nr":4 + "score":0.836046383 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2675890166 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.4043598708, - "sentence_nr":4 + "score":0.5349872169 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4090938759 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.3425668387, - "sentence_nr":4 + "score":0.6229850426 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3316785101 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4147702817, - "sentence_nr":4 + "score":0.5862021915 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.5917547348 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.4043598708, - "sentence_nr":4 + "score":0.7493377856 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4181179966 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.396188029, - "sentence_nr":4 + "score":0.6225342018 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4326454895 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.3985861327, - "sentence_nr":4 + "score":0.6447613926 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3651687929 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.3818534927, - "sentence_nr":4 + "score":0.5938680131 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3831360784 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.364411248, - "sentence_nr":4 + "score":0.6646674328 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3772905023 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.3898236605, - "sentence_nr":4 + "score":0.5716747693 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4648684731 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.5042211795, - "sentence_nr":4 + "score":0.5702790562 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4284391483 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 + "score":0.6436107817 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3533000629 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 + "score":0.6161033443 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2317334189 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 + "score":0.5101013277 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2648144898 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.5582360999, - "sentence_nr":4 + "score":0.4919964495 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4595839503 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5516607623, - "sentence_nr":4 + "score":0.678498887 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.478748482 + }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.4716061611, - "sentence_nr":4 + "score":0.6196055546 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3741937374 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5256353513, - "sentence_nr":4 + "score":0.6015951936 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.5289737883 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.3765697091, - "sentence_nr":4 + "score":0.7055677715 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2534743707, - "sentence_nr":4 + "score":0.2597045639 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5971149415, - "sentence_nr":4 + "score":0.5415502492 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.5240240402 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.4576529536, - "sentence_nr":4 + "score":0.677637684 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3411098531 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5309982647, - "sentence_nr":4 + "score":0.5298146709 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.479199485 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.4726395749, - "sentence_nr":4 + "score":0.6917999035 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4076773709 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4005242819, - "sentence_nr":4 + "score":0.6331898021 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3546746435 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.4214137028, - "sentence_nr":4 + "score":0.5752621807 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2460137258, - "sentence_nr":4 + "score":0.3221779371 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.6374693501, - "sentence_nr":4 + "score":0.5831693751 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.1892240569, - "sentence_nr":4 + "score":0.2652097773 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.6151179643, - "sentence_nr":4 + "score":0.4365593229 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2460137258, - "sentence_nr":4 + "score":0.3357390025 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.6869474337, - "sentence_nr":4 + "score":0.5736288237 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4227150213 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.4746119151, - "sentence_nr":4 + "score":0.6237856247 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2672185947 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5833743057, - "sentence_nr":4 + "score":0.5405753178 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3184157374 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-2.5-flash-preview", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.4642659596, - "sentence_nr":4 + "score":0.3790142738 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2627473985 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4123810027, - "sentence_nr":4 + "score":0.5441433858 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2905461034 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.4123810027, - "sentence_nr":4 + "score":0.533714307 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2482076583 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.4806367958, - "sentence_nr":4 + "score":0.5203197505 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2943876522 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.4326969206, - "sentence_nr":4 + "score":0.5061827933 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2926727761 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.4108469458, - "sentence_nr":4 + "score":0.5382695102 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4992927063 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.3990998963, - "sentence_nr":4 + "score":0.68458461 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3544545007 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.3991370902, - "sentence_nr":4 + "score":0.6065493785 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.4605012594 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.4044335714, - "sentence_nr":4 + "score":0.7071085486 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3062605383 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.3990998963, - "sentence_nr":4 + "score":0.5185293421 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.3113878808, - "sentence_nr":4 + "score":0.3509297564 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.6758978745, - "sentence_nr":4 + "score":0.5918368155 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.1718152967, - "sentence_nr":4 + "score":0.2672257271 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5293474686, - "sentence_nr":4 + "score":0.5461942844 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.2357831604, - "sentence_nr":4 + "score":0.5445047026 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.5821373704, - "sentence_nr":4 + "score":0.7187017022 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.1452867953, - "sentence_nr":4 + "score":0.3658457853 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5149523169, - "sentence_nr":4 + "score":0.6104356234 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.2289415686, - "sentence_nr":4 + "score":0.3523205262 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.6314372537, - "sentence_nr":4 + "score":0.5683614987 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2887138087, - "sentence_nr":5 + "score":0.3445897108 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.6342291346, - "sentence_nr":5 + "score":0.5707894245 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":5 + "score":0.3561921353 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":5 + "score":0.6497121165 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.7013062757, - "sentence_nr":5 + "score":0.3395831717 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.9303769449, - "sentence_nr":5 + "score":0.6027437002 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.4020848766 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.23816585, - "sentence_nr":5 + "score":0.4849709417 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":5 + "score":0.3178340836 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":5 + "score":0.5358308503 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.508747354, - "sentence_nr":5 + "score":0.2594137172 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.7647955332, - "sentence_nr":5 + "score":0.5439108225 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.508747354, - "sentence_nr":5 + "score":0.231055869 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.7647955332, - "sentence_nr":5 + "score":0.4704905603 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.508747354, - "sentence_nr":5 + "score":0.2167113972 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.7647955332, - "sentence_nr":5 + "score":0.446095738 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 + "score":0.4063183084 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 + "score":0.6360820916 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.5738396575, - "sentence_nr":5 + "score":0.4147226756 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.7983571334, - "sentence_nr":5 + "score":0.5528779397 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 + "score":0.3026809635 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 + "score":0.5703886674 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 + "score":0.4781663764 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 + "score":0.6799080797 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 + "score":0.2557079153 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 + "score":0.5311675905 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.6626129614, - "sentence_nr":5 + "score":0.3835973558 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.8597893118, - "sentence_nr":5 + "score":0.5821962599 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 + "score":0.2577141288 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 + "score":0.5044946448 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 + "score":0.359025417 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 + "score":0.6186979309 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.4027672046, - "sentence_nr":5 + "score":0.2906881879 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.6529271691, - "sentence_nr":5 + "score":0.5350481537 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 + "score":0.236600544 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 + "score":0.4972520076 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 + "score":0.2771747402 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 + "score":0.5443382904 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 + "score":0.1736835138 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 + "score":0.3883707647 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.5379348325, - "sentence_nr":5 + "score":0.2410514007 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.770376611, - "sentence_nr":5 + "score":0.4876248025 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.3018835387, - "sentence_nr":5 + "score":0.3887220068 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.6086565368, - "sentence_nr":5 + "score":0.6136859301 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.2239152297, - "sentence_nr":5 + "score":0.2111467812 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6087618281, - "sentence_nr":5 + "score":0.4809814755 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 + "score":0.2521327553 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 + "score":0.3112350874 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 + "score":0.2467308763 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 + "score":0.534220382 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 + "score":0.2743392971 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 + "score":0.5037551764 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.6026286935, - "sentence_nr":5 + "score":0.1944999711 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.8025775976, - "sentence_nr":5 + "score":0.4268510127 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.6626129614, - "sentence_nr":5 + "score":0.259115468 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.8597893118, - "sentence_nr":5 + "score":0.494497039 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.6626129614, - "sentence_nr":5 + "score":0.2829478955 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.8597893118, - "sentence_nr":5 + "score":0.4871806301 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 + "score":0.4110829383 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 + "score":0.6232948404 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.589661355, - "sentence_nr":5 + "score":0.3785767671 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.752891475, - "sentence_nr":5 + "score":0.609933858 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 + "score":0.51911398 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 + "score":0.7392276316 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.5300714513, - "sentence_nr":5 + "score":0.237555247 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.7461630751, - "sentence_nr":5 + "score":0.4538651122 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 + "score":0.3655739185 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 + "score":0.6222977455 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"fr", "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", "metric":"bleu", - "score":0.4801289745, - "sentence_nr":5 + "score":0.2666374602 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.6766690087, - "sentence_nr":5 + "score":0.499416925 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.3272712268, - "sentence_nr":5 + "score":0.4596821942 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.6272846474, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3272712268, - "sentence_nr":5 + "score":0.6596069595 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6272846474, - "sentence_nr":5 + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3042148589, - "sentence_nr":5 + "score":0.243987548 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5662363924, - "sentence_nr":5 + "score":0.4795583662 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.3207873973, - "sentence_nr":5 + "score":0.3694040944 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.5817366082, - "sentence_nr":5 + "score":0.5844559185 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2848931828, - "sentence_nr":5 + "score":0.2068662913 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.576432511, - "sentence_nr":5 + "score":0.4574195897 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.2981792161, - "sentence_nr":5 + "score":0.3502935028 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.5788026001, - "sentence_nr":5 + "score":0.6435312578 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3942058093, - "sentence_nr":5 + "score":0.2621288101 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5878575558, - "sentence_nr":5 + "score":0.5227903424 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.2981792161, - "sentence_nr":5 + "score":0.3001729338 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.5788026001, - "sentence_nr":5 + "score":0.4543813968 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3485799123, - "sentence_nr":5 + "score":0.2413161859 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.6090575372, - "sentence_nr":5 + "score":0.4889410755 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.6471892368, - "sentence_nr":5 + "score":0.2769851422 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.8142499722, - "sentence_nr":5 + "score":0.5709543626 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.7012294788, - "sentence_nr":5 + "score":0.1815113298 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.847811572, - "sentence_nr":5 + "score":0.4391057397 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 + "score":0.2353762412 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 + "score":0.4455494128 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.4020247735, - "sentence_nr":5 + "score":0.3485084476 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.7469480084, - "sentence_nr":5 + "score":0.5939961743 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 + "score":0.4125142357 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 + "score":0.5513553952 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2371332025, - "sentence_nr":5 + "score":0.2628896238 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.610684297, - "sentence_nr":5 + "score":0.5183595448 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.2169036581, - "sentence_nr":5 + "score":0.4596356921 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.5384773679, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2311466382, - "sentence_nr":5 + "score":0.6605740155 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5786592585, - "sentence_nr":5 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2212877653, - "sentence_nr":5 + "score":0.182466759 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.560943925, - "sentence_nr":5 + "score":0.4404528166 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.2212877653, - "sentence_nr":5 + "score":0.3555783157 }, { - "model":"openai\/gpt-4.1-mini", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.572263303, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6888365053, - "sentence_nr":5 + "score":0.5498712278 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8656273481, - "sentence_nr":5 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.2571138654, - "sentence_nr":5 + "score":0.2359761779 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.6088853752, - "sentence_nr":5 + "score":0.4965595451 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.2571138654, - "sentence_nr":5 + "score":0.2850822623 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.6088853752, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3416581331, - "sentence_nr":5 + "score":0.5802793004 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6578570934, - "sentence_nr":5 + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3060368951, - "sentence_nr":5 + "score":0.2700708569 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.6736142285, - "sentence_nr":5 + "score":0.5216974993 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 + "score":0.2200201561 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 + "score":0.4752363489 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":6 + "score":0.2468482501 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":6 + "score":0.5030755763 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":6 + "score":0.2478229019 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":6 + "score":0.4152088296 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":6 + "score":0.1594908644 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.3263040637, - "sentence_nr":6 + "score":0.3987254781 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 + "score":0.3413161409 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 + "score":0.6036920979 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.339038739, - "sentence_nr":6 + "score":0.2452562567 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6170420597, - "sentence_nr":6 + "score":0.4947687861 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"zh", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.3142665434, - "sentence_nr":6 + "score":0.2210892317 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemini-flash-1.5-8b", "bcp_47":"zh", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.6466526067, - "sentence_nr":6 + "score":0.2889702622 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.3751840463, - "sentence_nr":6 + "score":0.2378760525 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.6279894553, - "sentence_nr":6 + "score":0.5183150258 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.1926847964, - "sentence_nr":6 + "score":0.3230924319 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.5513970749, - "sentence_nr":6 + "score":0.5538406612 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 + "score":0.261796363 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 + "score":0.5061044452 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 + "score":0.3392340733 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 + "score":0.527149208 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.6255340042, - "sentence_nr":6 + "score":0.3574957943 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.8724783049, - "sentence_nr":6 + "score":0.5949602318 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 + "score":0.5362416556 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 + "score":0.7003378351 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3083012996, - "sentence_nr":6 + "score":0.4224513828 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.658937639, - "sentence_nr":6 + "score":0.6281695357 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.4302123694, - "sentence_nr":6 + "score":0.5351379766 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.7142896582, - "sentence_nr":6 + "score":0.7598417142 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 + "score":0.279398514 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"google\/gemma-3-27b-it", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 + "score":0.5677163743 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemma-3-27b-it", "bcp_47":"es", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 + "score":0.3796449789 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"google\/gemma-3-27b-it", "bcp_47":"es", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 + "score":0.6098050112 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 + "score":0.2586433932 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 + "score":0.5545655476 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 + "score":0.5217173445 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 + "score":0.706560562 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 + "score":0.3147708697 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 + "score":0.5735957081 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 + "score":0.3839899572 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 + "score":0.6091652356 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 + "score":0.2843117161 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 + "score":0.5625584849 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 + "score":0.3330091043 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 + "score":0.6452178521 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 + "score":0.2694680234 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 + "score":0.534930693 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 + "score":0.2886629345 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 + "score":0.4441001762 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.4101479465, - "sentence_nr":6 + "score":0.2889499493 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.7041976254, - "sentence_nr":6 + "score":0.4946977693 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.4547900039, - "sentence_nr":6 + "score":0.2708892281 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.6541971429, - "sentence_nr":6 + "score":0.5462808569 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2919394074, - "sentence_nr":6 + "score":0.2909291965 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5957961315, - "sentence_nr":6 + "score":0.5445276883 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.1753767087, - "sentence_nr":6 + "score":0.2268785589 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.480088967, - "sentence_nr":6 + "score":0.4679091917 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.33828653, - "sentence_nr":6 + "score":0.4076785456 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.6408187444, - "sentence_nr":6 + "score":0.6390667798 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 + "score":0.4008672864 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 + "score":0.5746982049 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 + "score":0.28456543 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 + "score":0.5644895825 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 + "score":0.5029529971 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 + "score":0.7001896317 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 + "score":0.2624491573 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 + "score":0.5200383542 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 + "score":0.5021166201 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 + "score":0.6735886 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.5950922113, - "sentence_nr":6 + "score":0.2077591586 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.7971172821, - "sentence_nr":6 + "score":0.484103396 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 + "score":0.3186094389 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.7122562458, - "sentence_nr":6 + "score":0.6101838123 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 + "score":0.2690763704 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.7122562458, - "sentence_nr":6 + "score":0.5194720687 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.4207937381, - "sentence_nr":6 + "score":0.2606721725 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.6985308026, - "sentence_nr":6 + "score":0.4856589279 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.6511582134, - "sentence_nr":6 + "score":0.2738179594 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.8600023705, - "sentence_nr":6 + "score":0.5231933041 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 + "score":0.2402519591 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 + "score":0.4398186462 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.3226386416, - "sentence_nr":6 + "score":0.2009145559 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.6824395077, - "sentence_nr":6 + "score":0.4683501544 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 + "score":0.3564695765 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.7719180937, - "sentence_nr":6 + "score":0.6122018967 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 + "score":0.1887088881 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.6590438072, - "sentence_nr":6 + "score":0.4674871904 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.3226386416, - "sentence_nr":6 + "score":0.2493415308 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", + "model":"google\/gemma-3-27b-it", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.6824395077, - "sentence_nr":6 + "score":0.3083774204 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 + "score":0.2106827678 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 + "score":0.4729315216 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.3830597818, - "sentence_nr":6 + "score":0.1833822876 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.6061131723, - "sentence_nr":6 + "score":0.4592369142 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.3463680071, - "sentence_nr":6 + "score":0.1849279476 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5167955767, - "sentence_nr":6 + "score":0.4313097332 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.3675667566, - "sentence_nr":6 + "score":0.2409740184 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.5397693417, - "sentence_nr":6 + "score":0.4412144476 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 + "score":0.2234676555 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.7417101158, - "sentence_nr":6 + "score":0.4567541675 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.4222184785, - "sentence_nr":6 + "score":0.3260331458 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.6656008733, - "sentence_nr":6 + "score":0.5706133276 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 + "score":0.1748225206 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 + "score":0.3715602465 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 + "score":0.3077182547 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 + "score":0.5349807426 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 + "score":0.1850637388 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 + "score":0.4446871408 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 + "score":0.3369466851 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 + "score":0.5877033036 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.4481489512, - "sentence_nr":6 + "score":0.2046187032 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.7994721822, - "sentence_nr":6 + "score":0.4459730588 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 + "score":0.4666795067 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 + "score":0.6677200822 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 + "score":0.3304821544 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 + "score":0.5478705434 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.387540775, - "sentence_nr":6 + "score":0.3530460218 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.5985033329, - "sentence_nr":6 + "score":0.558479654 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.5124776603, - "sentence_nr":6 + "score":0.1852494633 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.7722874801, - "sentence_nr":6 + "score":0.4413568977 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.179052784, - "sentence_nr":7 + "score":0.2908938694 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.3725729545, - "sentence_nr":7 + "score":0.5892878712 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.1552160603, - "sentence_nr":7 + "score":0.18258136 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.376453294, - "sentence_nr":7 + "score":0.4537379112 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.1262042989, - "sentence_nr":7 + "score":0.1225657534 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.3558070379, - "sentence_nr":7 + "score":0.199008122 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1287222063, - "sentence_nr":7 + "score":0.2245721935 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.3360263395, - "sentence_nr":7 + "score":0.4151722512 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.1446578398, - "sentence_nr":7 + "score":0.2248935322 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.3030283215, - "sentence_nr":7 + "score":0.5061056827 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.1418524086, - "sentence_nr":7 + "score":0.1740373958 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.3829577077, - "sentence_nr":7 + "score":0.45132413 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.1526801905, - "sentence_nr":7 + "score":0.1932088011 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.4102875762, - "sentence_nr":7 + "score":0.4185660328 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0308601662, - "sentence_nr":7 + "score":0.1523314336 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.1100250144, - "sentence_nr":7 + "score":0.3644985981 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.2125532771, - "sentence_nr":7 + "score":0.1654328825 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.4327215157, - "sentence_nr":7 + "score":0.3306856997 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.175608616, - "sentence_nr":7 + "score":0.1849607455 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4284862592, - "sentence_nr":7 + "score":0.4432514335 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.1738234764, - "sentence_nr":7 + "score":0.3735403041 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.4061580778, - "sentence_nr":7 + "score":0.6258974903 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.1386817294, - "sentence_nr":7 + "score":0.1542357564 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.3094469764, - "sentence_nr":7 + "score":0.407792192 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.1036185485, - "sentence_nr":7 + "score":0.3023477748 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.3277480271, - "sentence_nr":7 + "score":0.5524877157 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.1518696932, - "sentence_nr":7 + "score":0.1851974615 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.3458120002, - "sentence_nr":7 + "score":0.3965623482 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.1551417935, - "sentence_nr":7 + "score":0.1508209944 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.3762636488, - "sentence_nr":7 + "score":0.4882487732 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0943129772, - "sentence_nr":7 + "score":0.1379772803 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.3616856339, - "sentence_nr":7 + "score":0.4107039585 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.1109125268, - "sentence_nr":7 + "score":0.2016846201 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.2660763461, - "sentence_nr":7 + "score":0.4266778738 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":7 + "score":0.175281535 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.1897170832, - "sentence_nr":7 + "score":0.4308484341 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.1026674747, - "sentence_nr":7 + "score":0.2117497213 }, { "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.3364703639, - "sentence_nr":7 + "score":0.3938011024 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.1532505429, - "sentence_nr":7 + "score":0.1357518844 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4125406717, - "sentence_nr":7 + "score":0.3722986269 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.145578084, - "sentence_nr":7 + "score":0.2732555305 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.3659834676, - "sentence_nr":7 + "score":0.5379510442 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1815495479, - "sentence_nr":7 + "score":0.1738291666 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.4557483776, - "sentence_nr":7 + "score":0.4357500531 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.0689753389, - "sentence_nr":7 + "score":0.1521172398 + }, + { + "model":"meta-llama\/llama-3-70b-instruct", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.2131109353 }, { "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2776666563, - "sentence_nr":7 + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.1665765483, - "sentence_nr":7 + "score":0.2599940834 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4017968725, - "sentence_nr":7 + "score":0.5344413165 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ar", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1052201444, - "sentence_nr":7 + "score":0.3535082667 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ar", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.3254405154, - "sentence_nr":7 + "score":0.5618696854 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1678010916, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3968694015, - "sentence_nr":7 + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.1381751569, - "sentence_nr":7 + "score":0.2354383205 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.3121557499, - "sentence_nr":7 + "score":0.4808197348 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.1579497466, - "sentence_nr":7 + "score":0.3199525151 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.5092928546, - "sentence_nr":7 + "score":0.499911007 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.162868761, - "sentence_nr":7 + "score":0.3087730646 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.3422914837, - "sentence_nr":7 + "score":0.5446110065 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.2489421388, - "sentence_nr":7 + "score":0.4363239189 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.4083799714, - "sentence_nr":7 + "score":0.6606949091 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.1169764262, - "sentence_nr":7 + "score":0.5339078139 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.3711775364, - "sentence_nr":7 + "score":0.6892570142 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.2006511507, - "sentence_nr":7 + "score":0.6674605684 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.4084885616, - "sentence_nr":7 + "score":0.804371781 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":7 + "score":0.2419716374 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.1762196387, - "sentence_nr":7 + "score":0.507956668 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.0991614609, - "sentence_nr":7 + "score":0.3634368286 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.3121110161, - "sentence_nr":7 + "score":0.5899847818 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.156345665, - "sentence_nr":7 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"fr", "task":"translation_from", - "metric":"chrf", - "score":0.4110013716, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", "metric":"bleu", - "score":0.1380561569, - "sentence_nr":7 + "score":0.2344633197 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4078799873, - "sentence_nr":7 + "score":0.5330179435 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.122912191, - "sentence_nr":7 + "score":0.4911890131 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.3448002181, - "sentence_nr":7 + "score":0.6961788043 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1764307831, - "sentence_nr":7 + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4075758479, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.1989414239, - "sentence_nr":7 + "score":0.3846763493 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.3791567777, - "sentence_nr":7 + "score":0.6011964597 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.1947336505, - "sentence_nr":7 + "score":0.4163962042 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.4169850144, - "sentence_nr":7 + "score":0.6196043433 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1914828287, - "sentence_nr":7 + "score":0.2757294842 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4707949702, - "sentence_nr":7 + "score":0.5164990805 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.2060857231, - "sentence_nr":7 + "score":0.2979743631 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.4704943906, - "sentence_nr":7 + "score":0.621505647 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.0818335366, - "sentence_nr":7 + "score":0.3952954307 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.2500763339, - "sentence_nr":7 + "score":0.6095092587 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.0981642546, - "sentence_nr":7 + "score":0.3550137141 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.3179322233, - "sentence_nr":7 + "score":0.4750629972 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1643920943, - "sentence_nr":7 + "score":0.2908958438 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4076099284, - "sentence_nr":7 + "score":0.5056906446 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.1215724157, - "sentence_nr":7 + "score":0.278835165 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.4080990098, - "sentence_nr":7 + "score":0.4936217166 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.0854164839, - "sentence_nr":7 + "score":0.2506634169 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.2825804067, - "sentence_nr":7 + "score":0.4822339063 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.1041529816, - "sentence_nr":7 + "score":0.1977398 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.3345263292, - "sentence_nr":7 + "score":0.4512527967 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2120423927, - "sentence_nr":7 + "score":0.4150075487 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.3846197304, - "sentence_nr":7 + "score":0.5859289925 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1869333815, - "sentence_nr":7 + "score":0.4055714442 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.4290809947, - "sentence_nr":7 + "score":0.5640351838 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1643188797, - "sentence_nr":7 + "score":0.3043299439 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4088971379, - "sentence_nr":7 + "score":0.535196717 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.1145250892, - "sentence_nr":7 + "score":0.4680489994 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.3212742401, - "sentence_nr":7 + "score":0.6589781804 }, { "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0821835945, - "sentence_nr":7 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ru", "task":"translation_from", - "metric":"chrf", - "score":0.2390539176, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", "metric":"bleu", - "score":0.1767383562, - "sentence_nr":7 + "score":0.222732943 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.390208518, - "sentence_nr":7 + "score":0.4930414776 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1960939563, - "sentence_nr":7 + "score":0.338298129 }, { - "model":"openai\/gpt-4.1-mini", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.4429882447, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1518427872, - "sentence_nr":7 + "score":0.5638349443 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4093399938, - "sentence_nr":7 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.1547822267, - "sentence_nr":7 + "score":0.2821010087 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.355058476, - "sentence_nr":7 + "score":0.5068790976 }, { "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.0624444512, - "sentence_nr":7 + "score":0.2757507483 }, { "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.2823983493, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1568563265, - "sentence_nr":7 + "score":0.5718564064 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3437829588, - "sentence_nr":7 + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0826693165, - "sentence_nr":7 + "score":0.2421646919 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.3127511921, - "sentence_nr":7 + "score":0.4745308575 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.5989315087, - "sentence_nr":8 + "score":0.2617143353 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.7353063746, - "sentence_nr":8 + "score":0.5319635422 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.3067706489, - "sentence_nr":8 + "score":0.2376372003 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5308555945, - "sentence_nr":8 + "score":0.4703124968 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.1327526848, - "sentence_nr":8 + "score":0.2981093662 }, { "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.3785060249, - "sentence_nr":8 + "score":0.4567172276 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.1840503544, - "sentence_nr":8 + "score":0.2436649491 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.414290109, - "sentence_nr":8 + "score":0.4800401855 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.3190461612 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-3.1-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.3381363586, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4262221594, - "sentence_nr":8 + "score":0.5738845596 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5886657415, - "sentence_nr":8 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.2866084411, - "sentence_nr":8 + "score":0.241579409 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.4579283646, - "sentence_nr":8 + "score":0.4834754638 }, { "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"zh", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.2586113059, - "sentence_nr":8 + "score":0.2521936889 }, { "model":"meta-llama\/llama-3.1-70b-instruct", "bcp_47":"zh", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.3945264409, - "sentence_nr":8 + "score":0.3101863746 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2037925062, - "sentence_nr":8 + "score":0.2693485281 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4108541431, - "sentence_nr":8 + "score":0.526972026 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.299118757 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.1691326883, - "sentence_nr":8 + "score":0.5209634099 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 + "score":0.2349115906 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5792139687, - "sentence_nr":8 + "score":0.4958748831 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 + "score":0.3037551079 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.5553909583, - "sentence_nr":8 + "score":0.5104197052 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 + "score":0.2940412827 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5553909583, - "sentence_nr":8 + "score":0.5289123372 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.2579872309, - "sentence_nr":8 + "score":0.4945548288 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.524485423, - "sentence_nr":8 + "score":0.6883045723 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 + "score":0.5254997328 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5553909583, - "sentence_nr":8 + "score":0.6651833212 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.4609261192, - "sentence_nr":8 + "score":0.6367218418 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.6365915339, - "sentence_nr":8 + "score":0.7901906482 }, { "model":"meta-llama\/llama-3.3-70b-instruct", "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1690979933, - "sentence_nr":8 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { "model":"meta-llama\/llama-3.3-70b-instruct", "bcp_47":"es", "task":"translation_from", - "metric":"chrf", - "score":0.3751861276, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.2547596952 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"meta-llama\/llama-3.3-70b-instruct", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.3344305109, - "sentence_nr":8 + "score":0.5121489935 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"meta-llama\/llama-3.3-70b-instruct", "bcp_47":"es", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.3970366728 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"meta-llama\/llama-3.3-70b-instruct", "bcp_47":"es", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.3701750146, - "sentence_nr":8 + "score":0.6218247901 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2283032715, - "sentence_nr":8 + "score":0.2933660925 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4341368545, - "sentence_nr":8 + "score":0.5571361609 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.5234484809, - "sentence_nr":8 + "score":0.5068230898 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.6658297774, - "sentence_nr":8 + "score":0.6748037018 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.2840563957, - "sentence_nr":8 + "score":0.343226497 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.5110250591, - "sentence_nr":8 + "score":0.5766444084 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.3000750469, - "sentence_nr":8 + "score":0.3910462734 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.5153810823, - "sentence_nr":8 + "score":0.5964148868 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1407495777, - "sentence_nr":8 + "score":0.2823009881 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.3750035199, - "sentence_nr":8 + "score":0.5398328113 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.2543269102, - "sentence_nr":8 + "score":0.3103565141 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.4829947079, - "sentence_nr":8 + "score":0.6174908793 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3815250265, - "sentence_nr":8 + "score":0.3323087124 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.6516314752, - "sentence_nr":8 + "score":0.5573643434 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.1992041348, - "sentence_nr":8 + "score":0.3398063689 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.4253779693, - "sentence_nr":8 + "score":0.439612207 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1899029242, - "sentence_nr":8 + "score":0.3202476462 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.407218439, - "sentence_nr":8 + "score":0.5170575936 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.1871026059, - "sentence_nr":8 + "score":0.2655261196 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.4433431372, - "sentence_nr":8 + "score":0.5078431653 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2049841563, - "sentence_nr":8 + "score":0.2672781462 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.4155916631, - "sentence_nr":8 + "score":0.5076383126 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.4000381043, - "sentence_nr":8 + "score":0.1627869169 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.5899097408, - "sentence_nr":8 + "score":0.4085690767 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2040179688, - "sentence_nr":8 + "score":0.4343597896 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4331763045, - "sentence_nr":8 + "score":0.612284022 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.2097387762, - "sentence_nr":8 + "score":0.4056628693 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.4966330151, - "sentence_nr":8 + "score":0.577470079 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2706716802, - "sentence_nr":8 + "score":0.2561623538 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5439625482, - "sentence_nr":8 + "score":0.5084673727 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.3337338879, - "sentence_nr":8 + "score":0.4822378549 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.550089922, - "sentence_nr":8 + "score":0.6805267649 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.3804753173, - "sentence_nr":8 + "score":0.2002083293 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.494857231, - "sentence_nr":8 + "score":0.4701113234 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.204488707, - "sentence_nr":8 + "score":0.3404957825 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.3847158513, - "sentence_nr":8 + "score":0.5535956904 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.2309552735, - "sentence_nr":8 + "score":0.2378532768 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.4672309378, - "sentence_nr":8 + "score":0.488547843 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.265213578 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.2988665867, - "sentence_nr":8 + "score":0.5688332618 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.2212863699 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.327060774, - "sentence_nr":8 + "score":0.4840600136 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.448923596, - "sentence_nr":8 + "score":0.2690593843 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.5934678825, - "sentence_nr":8 + "score":0.5097708439 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.298050419, - "sentence_nr":8 + "score":0.2689156709 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.510126892, - "sentence_nr":8 + "score":0.5166231119 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.2880086933, - "sentence_nr":8 + "score":0.2395415037 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.4934867862, - "sentence_nr":8 + "score":0.4291961624 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2429163097, - "sentence_nr":8 + "score":0.1514958599 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.5044329486, - "sentence_nr":8 + "score":0.393503436 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.3205104057, - "sentence_nr":8 + "score":0.3126864004 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.584870798, - "sentence_nr":8 + "score":0.5612804645 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.4683276331, - "sentence_nr":8 + "score":0.2120665528 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"meta-llama\/llama-3.3-70b-instruct", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.8176110135, - "sentence_nr":8 + "score":0.473531494 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.9436043262, - "sentence_nr":8 + "score":0.2450622208 }, { "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.988019168, - "sentence_nr":8 + "score":0.3218418642 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":8 + "score":0.296505833 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":8 + "score":0.5400572519 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.340461259 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.0067104199, - "sentence_nr":8 + "score":0.5619514904 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":8 + "score":0.2759322818 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":8 + "score":0.520565338 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.3642482473, - "sentence_nr":8 + "score":0.338451158 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.5342538783, - "sentence_nr":8 + "score":0.5187985166 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.188319335, - "sentence_nr":8 + "score":0.3759519266 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.4318025704, - "sentence_nr":8 + "score":0.5897372465 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.4439623528, - "sentence_nr":8 + "score":0.4241869609 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.5309137919, - "sentence_nr":8 + "score":0.6369588457 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.5411864684 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.2628849077, - "sentence_nr":8 + "score":0.6967802953 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.2375594795, - "sentence_nr":8 + "score":0.6482731713 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.4291541973, - "sentence_nr":8 + "score":0.8116769221 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.284061369, - "sentence_nr":8 + "score":0.2922155838 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5649283064, - "sentence_nr":8 + "score":0.5497719853 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.2154402759, - "sentence_nr":8 + "score":0.338476596 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.5040038441, - "sentence_nr":8 + "score":0.5745067933 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.2953732107 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.2855212789, - "sentence_nr":8 + "score":0.5548969581 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.5304234655 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.1644894761, - "sentence_nr":8 + "score":0.7109575095 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":8 + "score":0.3775698519 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.2364455179, - "sentence_nr":8 + "score":0.5982891247 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.1855954214, - "sentence_nr":9 + "score":0.3986854808 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.3804842883, - "sentence_nr":9 + "score":0.591115524 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3536937539, - "sentence_nr":9 + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1308768293, - "sentence_nr":9 + "score":0.2279863353 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.1946295298, - "sentence_nr":9 + "score":0.5022597218 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.3892094891 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.0135384977, - "sentence_nr":9 + "score":0.6520141168 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3375178722, - "sentence_nr":9 + "score":0.3788371121 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.4840651439, - "sentence_nr":9 + "score":0.6055484505 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.1512218921, - "sentence_nr":9 + "score":0.3351360505 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.2675011051, - "sentence_nr":9 + "score":0.4702609655 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.1075992769, - "sentence_nr":9 + "score":0.3432613501 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.2106579454, - "sentence_nr":9 + "score":0.5702557631 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.0784377299, - "sentence_nr":9 + "score":0.2987779883 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.1324578892, - "sentence_nr":9 + "score":0.5727527461 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.245468889 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.0816397707, - "sentence_nr":9 + "score":0.5195139142 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.1617131493, - "sentence_nr":9 + "score":0.2246556712 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.2876418496, - "sentence_nr":9 + "score":0.4485577055 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2168548583, - "sentence_nr":9 + "score":0.4116477856 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.3714219747, - "sentence_nr":9 + "score":0.6206199646 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pa", + "task":"translation_to", "metric":"bleu", - "score":0.1227409298, - "sentence_nr":9 + "score":0.4995455509 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pa", + "task":"translation_to", "metric":"chrf", - "score":0.3385513652, - "sentence_nr":9 + "score":0.619445933 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1463197333, - "sentence_nr":9 + "score":0.3804523937 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.3661372734, - "sentence_nr":9 + "score":0.5992357582 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.1265649403, - "sentence_nr":9 + "score":0.4118835999 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.3156355831, - "sentence_nr":9 + "score":0.6402783366 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2496001284, - "sentence_nr":9 + "score":0.2711737241 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.4448983036, - "sentence_nr":9 + "score":0.5223358319 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "bcp_47":"ru", + "task":"translation_to", "metric":"bleu", - "score":0.1122890322, - "sentence_nr":9 + "score":0.3600231378 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", + "bcp_47":"ru", + "task":"translation_to", "metric":"chrf", - "score":0.1772610005, - "sentence_nr":9 + "score":0.5851662403 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.2816996366 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.3101771609, - "sentence_nr":9 + "score":0.5425859416 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"translation_to", "metric":"bleu", - "score":0.1427671612, - "sentence_nr":9 + "score":0.3295094623 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"sw", + "task":"translation_to", "metric":"chrf", - "score":0.3191375425, - "sentence_nr":9 + "score":0.6093047217 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.3372428289 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.0223039199, - "sentence_nr":9 + "score":0.5687146545 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"translation_to", "metric":"bleu", - "score":0.2676522616, - "sentence_nr":9 + "score":0.3362998921 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"te", + "task":"translation_to", "metric":"chrf", - "score":0.4201493552, - "sentence_nr":9 + "score":0.5480115484 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.2130096226 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.3710595253, - "sentence_nr":9 + "score":0.4588260908 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ur", + "task":"translation_to", "metric":"bleu", - "score":0.2168828306, - "sentence_nr":9 + "score":0.2672672187 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"ur", + "task":"translation_to", "metric":"chrf", - "score":0.4177582416, - "sentence_nr":9 + "score":0.4657426772 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.182352473, - "sentence_nr":9 + "score":0.1973356715 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4077952398, - "sentence_nr":9 + "score":0.4598464437 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.3356973056 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"vi", + "task":"translation_to", "metric":"chrf", - "score":0.0139152884, - "sentence_nr":9 + "score":0.6057343387 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1949274978, - "sentence_nr":9 + "score":0.2839664983 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"meta-llama\/llama-4-maverick", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.4345593627, - "sentence_nr":9 + "score":0.5496970367 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "bcp_47":"zh", + "task":"translation_to", "metric":"bleu", - "score":0.1266637216, - "sentence_nr":9 + "score":0.2404693379 }, { "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", + "bcp_47":"zh", + "task":"translation_to", "metric":"chrf", - "score":0.2650373529, - "sentence_nr":9 + "score":0.2741729656 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.1216277939, - "sentence_nr":9 + "score":0.1333199947 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.3228288841, - "sentence_nr":9 + "score":0.3787420394 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"translation_to", "metric":"bleu", - "score":0.1649662542, - "sentence_nr":9 + "score":0.2639924417 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"ar", + "task":"translation_to", "metric":"chrf", - "score":0.3466546857, - "sentence_nr":9 + "score":0.4508419338 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.0781077372 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"microsoft\/phi-4", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.0153696674, - "sentence_nr":9 + "score":0.3675270991 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"translation_to", "metric":"bleu", - "score":0.1588436203, - "sentence_nr":9 + "score":0.1386482919 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"bn", + "task":"translation_to", "metric":"chrf", - "score":0.3981499896, - "sentence_nr":9 + "score":0.3721300124 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.2032648426, - "sentence_nr":9 + "score":0.2182705396 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.2922087191, - "sentence_nr":9 + "score":0.4808885751 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"translation_to", "metric":"bleu", - "score":0.1823759948, - "sentence_nr":9 + "score":0.3009940804 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"de", + "task":"translation_to", "metric":"chrf", - "score":0.3740403512, - "sentence_nr":9 + "score":0.5563863941 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.3417051248 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.2244748716, - "sentence_nr":9 + "score":0.5564910783 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.505573911 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"en", + "task":"translation_to", "metric":"chrf", - "score":0.0072819069, - "sentence_nr":9 + "score":0.7036775988 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3662268411, - "sentence_nr":9 + "score":0.162581322 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"microsoft\/phi-4", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5409038674, - "sentence_nr":9 + "score":0.4452830938 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"es", + "task":"translation_to", "metric":"bleu", - "score":0.1740044679, - "sentence_nr":9 + "score":0.3120471917 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"es", + "task":"translation_to", "metric":"chrf", - "score":0.3637515238, - "sentence_nr":9 + "score":0.5521181062 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.1287668952, - "sentence_nr":9 + "score":0.1841410036 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.3253153379, - "sentence_nr":9 + "score":0.4498873761 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"fr", + "task":"translation_to", "metric":"bleu", - "score":0.1326935302, - "sentence_nr":9 + "score":0.3957930078 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"fr", + "task":"translation_to", "metric":"chrf", - "score":0.2899808984, - "sentence_nr":9 + "score":0.5908491177 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.2781818374 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"microsoft\/phi-4", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.013575256, - "sentence_nr":9 + "score":0.5317078224 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"hi", + "task":"translation_to", "metric":"bleu", - "score":0.2592282745, - "sentence_nr":9 + "score":0.2082459717 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"hi", + "task":"translation_to", "metric":"chrf", - "score":0.3913113625, - "sentence_nr":9 + "score":0.3612751063 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3227889517, - "sentence_nr":9 + "score":0.14109102 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4026302132, - "sentence_nr":9 + "score":0.4206086243 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"id", + "task":"translation_to", "metric":"bleu", - "score":0.1191597493, - "sentence_nr":9 + "score":0.2541374481 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"id", + "task":"translation_to", "metric":"chrf", - "score":0.2129794266, - "sentence_nr":9 + "score":0.5738191205 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.140502651, - "sentence_nr":9 + "score":0.217631862 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.2478525818, - "sentence_nr":9 + "score":0.4810988251 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"ja", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.3314270444 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"ja", + "task":"translation_to", "metric":"chrf", - "score":0.0223039199, - "sentence_nr":9 + "score":0.4579736168 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2791576982, - "sentence_nr":9 + "score":0.1369006135 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"microsoft\/phi-4", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.369632421, - "sentence_nr":9 + "score":0.3726552499 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"jv", + "task":"translation_to", "metric":"bleu", - "score":0.1692546646, - "sentence_nr":9 + "score":0.1358290891 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"jv", + "task":"translation_to", "metric":"chrf", - "score":0.3591239885, - "sentence_nr":9 + "score":0.4485195299 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2036348471, - "sentence_nr":9 + "score":0.1220522034 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", + "model":"microsoft\/phi-4", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.3472831656, - "sentence_nr":9 + "score":0.394432105 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"mr", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.0877294163 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"mr", + "task":"translation_to", "metric":"chrf", - "score":0.2154769743, - "sentence_nr":9 + "score":0.3228035874 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.2872682457 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.180399603, - "sentence_nr":9 + "score":0.5343897569 }, { - "model":"openai\/gpt-4.1-mini", + "model":"microsoft\/phi-4", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1464506683, - "sentence_nr":9 + "score":0.2344910913 }, { - "model":"openai\/gpt-4.1-mini", + "model":"microsoft\/phi-4", "bcp_47":"pa", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.348347983, - "sentence_nr":9 + "score":0.4302635187 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"microsoft\/phi-4", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2327080491, - "sentence_nr":9 + "score":0.1578818745 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", + "model":"microsoft\/phi-4", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.4213315211, - "sentence_nr":9 + "score":0.4563510644 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"pt", + "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.3548341797 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", + "model":"microsoft\/phi-4", + "bcp_47":"pt", + "task":"translation_to", "metric":"chrf", - "score":0.2436235351, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1400583077, - "sentence_nr":9 + "score":0.5851699932 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2827131457, - "sentence_nr":9 + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.1518810674 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.0194337786, - "sentence_nr":9 + "score":0.4229373334 }, { - "model":"openai\/gpt-4.1-mini", + "model":"microsoft\/phi-4", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.3114449377, - "sentence_nr":9 + "score":0.280180123 }, { - "model":"openai\/gpt-4.1-mini", + "model":"microsoft\/phi-4", "bcp_47":"ru", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.4723803506, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.5388785418 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"microsoft\/phi-4", "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2568191876, - "sentence_nr":9 + "task":"mmlu", + "metric":"accuracy", + "score":0.5 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.1197479462 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.2813584915, - "sentence_nr":9 + "score":0.3847229786 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"bleu", - "score":0.1358560869, - "sentence_nr":9 + "score":0.1284176951 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"sw", - "task":"translation_from", + "task":"translation_to", "metric":"chrf", - "score":0.2460209347, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.4471488498 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0147491229, - "sentence_nr":9 + "model":"microsoft\/phi-4", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":9 + "score":0.1221237902 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.2390985318, - "sentence_nr":9 + "score":0.3753302424 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.6358921903, - "sentence_nr":0 + "score":0.1342135875 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.8041899227, - "sentence_nr":0 + "score":0.3921252544 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"microsoft\/phi-4", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.6299285159, - "sentence_nr":0 + "score":0.1013597082 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"microsoft\/phi-4", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.7993134129, - "sentence_nr":0 + "score":0.3226565783 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.710159574, - "sentence_nr":0 + "score":0.1055049805 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.8462481748, - "sentence_nr":0 + "score":0.3270359823 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"microsoft\/phi-4", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.5487830137, - "sentence_nr":0 + "score":0.1212000479 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"microsoft\/phi-4", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.7723896504, - "sentence_nr":0 + "score":0.3499332758 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.5375319287, - "sentence_nr":0 + "score":0.2215772318 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"microsoft\/phi-4", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.7826716937, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3505907645, - "sentence_nr":0 + "score":0.4885306046 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"microsoft\/phi-4", "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4021980348, - "sentence_nr":0 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"zh", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.4131612771, - "sentence_nr":0 + "score":0.1515209994 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"zh", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.4430321339, - "sentence_nr":0 + "score":0.4261650622 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3993284843, - "sentence_nr":0 + "score":0.1646480678 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"microsoft\/phi-4", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.4224738565, - "sentence_nr":0 + "score":0.2556911118 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.2908087026, - "sentence_nr":0 + "score":0.12805161 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", + "task":"translation_from", "metric":"chrf", - "score":0.34113614, - "sentence_nr":0 + "score":0.3001336989 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3686151885, - "sentence_nr":0 + "score":0.1701118305 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.3858999291, - "sentence_nr":0 + "score":0.2705414464 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.8780634321, - "sentence_nr":0 + "score":0.0274986656 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.9269467001, - "sentence_nr":0 + "score":0.2715478832 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.7964573358, - "sentence_nr":0 + "score":0.0364128057 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.8458636472, - "sentence_nr":0 + "score":0.1916781774 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":0 + "score":0.1092874906 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":0 + "score":0.3511512521 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.9452996323, - "sentence_nr":0 + "score":0.1229942688 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.9463396364, - "sentence_nr":0 + "score":0.3801618008 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"en", + "task":"translation_from", "metric":"bleu", - "score":0.8781548422, - "sentence_nr":0 + "score":0.3724031885 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"en", + "task":"translation_from", "metric":"chrf", - "score":0.9156314785, - "sentence_nr":0 + "score":0.5022830131 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.4067397119, - "sentence_nr":0 + "score":0.4547673266 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.6897190926, - "sentence_nr":0 + "score":0.6611296308 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", - "task":"translation_to", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"es", + "task":"translation_from", "metric":"bleu", - "score":0.3707525915, - "sentence_nr":0 + "score":0.1090053669 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.6481906762, - "sentence_nr":0 + "score":0.3312266479 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.4405434566, - "sentence_nr":0 + "score":0.2527998075 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"microsoft\/phi-4-multimodal-instruct", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6872423435, - "sentence_nr":0 + "score":0.4585982852 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fr", + "task":"translation_from", "metric":"bleu", - "score":0.340705194, - "sentence_nr":0 + "score":0.0725417811 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.6376396417, - "sentence_nr":0 + "score":0.2990918671 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.3134536528, - "sentence_nr":0 + "score":0.2151316826 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.6269464695, - "sentence_nr":0 + "score":0.4131412973 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.7033737197, - "sentence_nr":0 + "score":0.1923702178 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.7784050705, - "sentence_nr":0 + "score":0.4177039104 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.4699587339, - "sentence_nr":0 + "score":0.1946792857 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.584375606, - "sentence_nr":0 + "score":0.3652693419 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.6034601376, - "sentence_nr":0 + "score":0.141847306 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.7074074363, - "sentence_nr":0 + "score":0.3708481852 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.520069265, - "sentence_nr":0 + "score":0.0995355066 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.6586847274, - "sentence_nr":0 + "score":0.3111314573 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.5176708393, - "sentence_nr":0 + "score":0.2032657995 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.6443244311, - "sentence_nr":0 + "score":0.3735202727 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3489926819, - "sentence_nr":0 + "score":0.2250820799 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5715668842, - "sentence_nr":0 + "score":0.3303987825 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.2786169605, - "sentence_nr":0 + "score":0.0965458717 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.5267252236, - "sentence_nr":0 + "score":0.2876791143 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.3544632222, - "sentence_nr":0 + "score":0.0955767676 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5208748527, - "sentence_nr":0 + "score":0.2170187808 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.2679728612, - "sentence_nr":0 + "score":0.0250471784 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.4666913728, - "sentence_nr":0 + "score":0.191193874 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.3244555847, - "sentence_nr":0 + "score":0.0430511796 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.5576074375, - "sentence_nr":0 + "score":0.2530147609 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", + "task":"translation_from", "metric":"bleu", - "score":0.341024469, - "sentence_nr":0 + "score":0.2939382507 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", + "task":"translation_from", "metric":"chrf", - "score":0.5816669417, - "sentence_nr":0 + "score":0.4236905058 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.4234343012, - "sentence_nr":0 + "score":0.2038997189 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.6625289906, - "sentence_nr":0 + "score":0.3029720916 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", + "task":"translation_from", "metric":"bleu", - "score":0.3885765192, - "sentence_nr":0 + "score":0.1164585656 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", + "task":"translation_from", "metric":"chrf", - "score":0.6554470157, - "sentence_nr":0 + "score":0.3513786374 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.381088643, - "sentence_nr":0 + "score":0.1159124937 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6485553379, - "sentence_nr":0 + "score":0.3709389273 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", + "task":"translation_from", "metric":"bleu", - "score":0.3602811871, - "sentence_nr":0 + "score":0.0726892156 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", + "task":"translation_from", "metric":"chrf", - "score":0.6460863746, - "sentence_nr":0 + "score":0.2863134478 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.4324680012, - "sentence_nr":0 + "score":0.1856825973 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.5877600879, - "sentence_nr":0 + "score":0.4059546251 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", + "task":"translation_from", "metric":"bleu", - "score":0.4493940084, - "sentence_nr":0 + "score":0.0285853745 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", + "task":"translation_from", "metric":"chrf", - "score":0.6230960824, - "sentence_nr":0 + "score":0.258743147 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.4116575553, - "sentence_nr":0 + "score":0.025156184 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.5665759692, - "sentence_nr":0 + "score":0.1783483023 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.3533147318, - "sentence_nr":0 + "score":0.0776108509 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.5972951641, - "sentence_nr":0 + "score":0.2968212875 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.4771981138, - "sentence_nr":0 + "score":0.0381758727 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6315763749, - "sentence_nr":0 + "score":0.2127544397 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.6947677374, - "sentence_nr":0 + "score":0.0750463099 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.7941300667, - "sentence_nr":0 + "score":0.2214284722 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.6412098672, - "sentence_nr":0 + "score":0.070850694 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.7665040244, - "sentence_nr":0 + "score":0.2944265552 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.6045639361, - "sentence_nr":0 + "score":0.0771444238 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.7576570568, - "sentence_nr":0 + "score":0.2978139061 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.5438238038, - "sentence_nr":0 + "score":0.0799080562 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.7060850658, - "sentence_nr":0 + "score":0.2533330302 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":0.6197738787, - "sentence_nr":0 + "score":0.0844065166 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":0.7658055016, - "sentence_nr":0 + "score":0.3102353728 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3861375213, - "sentence_nr":0 + "score":0.1424724277 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"microsoft\/phi-4-multimodal-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.5122109329, - "sentence_nr":0 + "score":0.1997648583 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.3253992126, - "sentence_nr":0 + "score":0.1411079383 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", + "task":"translation_from", "metric":"chrf", - "score":0.5133457276, - "sentence_nr":0 + "score":0.4288778553 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3750795127, - "sentence_nr":0 + "score":0.0953750383 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.5371301483, - "sentence_nr":0 + "score":0.3064512757 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.4845646373, - "sentence_nr":0 + "score":0.1056007136 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.5906105669, - "sentence_nr":0 + "score":0.3471561552 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.4092755331, - "sentence_nr":0 + "score":0.1826317159 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"mistralai\/mistral-nemo", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.5662949759, - "sentence_nr":0 + "score":0.4009621221 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.4354194543, - "sentence_nr":0 + "score":0.1779380635 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.665617533, - "sentence_nr":0 + "score":0.4500965094 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.5941815558, - "sentence_nr":0 + "score":0.2121723095 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.7983203559, - "sentence_nr":0 + "score":0.5030225058 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", + "task":"translation_from", "metric":"bleu", - "score":0.4524360013, - "sentence_nr":0 + "score":0.3044634871 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", + "task":"translation_from", "metric":"chrf", - "score":0.6715594087, - "sentence_nr":0 + "score":0.5185245123 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.335542878, - "sentence_nr":0 + "score":0.4511358274 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-nemo", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.6348737823, - "sentence_nr":0 + "score":0.7059119826 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", + "task":"translation_from", "metric":"bleu", - "score":0.5203658198, - "sentence_nr":0 + "score":0.1945088953 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", + "task":"translation_from", "metric":"chrf", - "score":0.7286515973, - "sentence_nr":0 + "score":0.4507966567 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.398304592, - "sentence_nr":0 + "score":0.3128110525 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6521777109, - "sentence_nr":0 + "score":0.564309507 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", + "task":"translation_from", "metric":"bleu", - "score":0.2682038772, - "sentence_nr":0 + "score":0.1503854665 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.5791297455, - "sentence_nr":0 + "score":0.4086984161 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.2276653674, - "sentence_nr":0 + "score":0.4089231963 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.5321260121, - "sentence_nr":0 + "score":0.6185522756 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.1498185575, - "sentence_nr":0 + "score":0.2552169122 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.5073561651, - "sentence_nr":0 + "score":0.473817666 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3776712971, - "sentence_nr":0 + "score":0.245531449 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"mistralai\/mistral-nemo", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.6263797337, - "sentence_nr":0 + "score":0.49602593 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.3880515885, - "sentence_nr":1 + "score":0.183278736 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.6587916716, - "sentence_nr":1 + "score":0.4259117743 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.5142726846, - "sentence_nr":1 + "score":0.1644315134 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.7344716263, - "sentence_nr":1 + "score":0.4582343316 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.6066498621, - "sentence_nr":1 + "score":0.2091363742 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.7812137754, - "sentence_nr":1 + "score":0.4571081356 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.4342750765, - "sentence_nr":1 + "score":0.1736443062 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.7115011222, - "sentence_nr":1 + "score":0.2944908594 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.3893969298, - "sentence_nr":1 + "score":0.1871758781 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.6629460107, - "sentence_nr":1 + "score":0.3534639201 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.4487746168, - "sentence_nr":1 + "score":0.1246961548 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.4476730201, - "sentence_nr":1 + "score":0.3016674377 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.28366234, - "sentence_nr":1 + "score":0.1225817213 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.2914733724, - "sentence_nr":1 + "score":0.3113005758 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2775905064, - "sentence_nr":1 + "score":0.1352680788 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.316576728, - "sentence_nr":1 + "score":0.2974034458 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", + "task":"translation_from", "metric":"bleu", - "score":0.2891243295, - "sentence_nr":1 + "score":0.3657744488 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", + "task":"translation_from", "metric":"chrf", - "score":0.3111960394, - "sentence_nr":1 + "score":0.5584856442 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.3679317258, - "sentence_nr":1 + "score":0.2676684918 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.3623820326, - "sentence_nr":1 + "score":0.4408840729 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", + "task":"translation_from", "metric":"bleu", - "score":0.2113054108, - "sentence_nr":1 + "score":0.1448893824 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", + "task":"translation_from", "metric":"chrf", - "score":0.4423822999, - "sentence_nr":1 + "score":0.4141759018 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.2620790359, - "sentence_nr":1 + "score":0.3802451797 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.5007312322, - "sentence_nr":1 + "score":0.5985788184 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", + "task":"translation_from", "metric":"bleu", - "score":0.1609807304, - "sentence_nr":1 + "score":0.1462210673 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", + "task":"translation_from", "metric":"chrf", - "score":0.3971037508, - "sentence_nr":1 + "score":0.4241453806 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1146562315, - "sentence_nr":1 + "score":0.2074330919 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.4497512969, - "sentence_nr":1 + "score":0.4438291243 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", + "task":"translation_from", "metric":"bleu", - "score":0.2035086444, - "sentence_nr":1 + "score":0.0700151652 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", + "task":"translation_from", "metric":"chrf", - "score":0.4226564278, - "sentence_nr":1 + "score":0.267224603 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.4556160154, - "sentence_nr":1 + "score":0.0414991243 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.6661994452, - "sentence_nr":1 + "score":0.3151327738 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.321675602, - "sentence_nr":1 + "score":0.0841044753 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.6141241026, - "sentence_nr":1 + "score":0.3329048731 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.4336904847, - "sentence_nr":1 + "score":0.1093199271 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6586872889, - "sentence_nr":1 + "score":0.3565208631 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.4098419225, - "sentence_nr":1 + "score":0.0712938477 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.6358736384, - "sentence_nr":1 + "score":0.34111588 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.3916220735, - "sentence_nr":1 + "score":0.1282666873 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", + "model":"mistralai\/mistral-nemo", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.6550784354, - "sentence_nr":1 + "score":0.355242737 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.3757080934, - "sentence_nr":1 + "score":0.1008653377 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.6339141735, - "sentence_nr":1 + "score":0.3602737727 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.5593324226, - "sentence_nr":1 + "score":0.0837032908 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.7332911901, - "sentence_nr":1 + "score":0.2497686258 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":0.4845738245, - "sentence_nr":1 + "score":0.1835816123 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":0.7144409873, - "sentence_nr":1 + "score":0.4240772425 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.4881942815, - "sentence_nr":1 + "score":0.1204225303 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-nemo", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.6662053432, - "sentence_nr":1 + "score":0.2073656478 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"ar", - "task":"translation_to", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.4577386766, - "sentence_nr":1 + "score":0.2307115512 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"ar", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.6531477301, - "sentence_nr":1 + "score":0.4984040511 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3446592077, - "sentence_nr":1 + "score":0.3687026411 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.5819912584, - "sentence_nr":1 + "score":0.5939572307 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.232709381, - "sentence_nr":1 + "score":0.2038963891 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.4490269267, - "sentence_nr":1 + "score":0.4710421194 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.3131013355 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.1163446833, - "sentence_nr":1 + "score":0.4896188194 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.1766119945, - "sentence_nr":1 + "score":0.2711678576 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.3986479587, - "sentence_nr":1 + "score":0.5010413002 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.365728408, - "sentence_nr":1 + "score":0.3851397268 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"mistralai\/mistral-saba", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.5794132414, - "sentence_nr":1 + "score":0.6299318639 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"en", + "task":"translation_from", "metric":"bleu", - "score":0.5295277583, - "sentence_nr":1 + "score":0.3971499204 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"en", + "task":"translation_from", "metric":"chrf", - "score":0.6540432511, - "sentence_nr":1 + "score":0.5704846467 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.4970423291, - "sentence_nr":1 + "score":0.5236846455 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.6453248294, - "sentence_nr":1 + "score":0.750594995 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"es", + "task":"translation_from", "metric":"bleu", - "score":0.4970423291, - "sentence_nr":1 + "score":0.2325003342 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"es", + "task":"translation_from", "metric":"chrf", - "score":0.6453248294, - "sentence_nr":1 + "score":0.4556556517 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.5494410974, - "sentence_nr":1 + "score":0.2894670078 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-saba", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6853937472, - "sentence_nr":1 + "score":0.552498138 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.464523041, - "sentence_nr":1 + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6240758264, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.3479698394, - "sentence_nr":1 + "score":0.1905858019 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.5760833126, - "sentence_nr":1 + "score":0.4419502294 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.2437325371, - "sentence_nr":1 + "score":0.4778596825 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.4948203921, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3120506351, - "sentence_nr":1 + "score":0.6586250533 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5390444512, - "sentence_nr":1 + "model":"mistralai\/mistral-saba", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.2422988979, - "sentence_nr":1 + "score":0.3285111598 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.4853505496, - "sentence_nr":1 + "score":0.5456949766 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.2759710526, - "sentence_nr":1 + "score":0.3807039375 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", + "model":"mistralai\/mistral-saba", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.5468536897, - "sentence_nr":1 + "score":0.5585736378 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.298869704, - "sentence_nr":1 + "score":0.266611987 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.544252266, - "sentence_nr":1 + "score":0.4806521836 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.5007036357, - "sentence_nr":1 + "score":0.280362444 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.6501904887, - "sentence_nr":1 + "score":0.5856798399 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.487646318, - "sentence_nr":1 + "score":0.2716028557 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.6113405964, - "sentence_nr":1 + "score":0.5228700434 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.5199813504, - "sentence_nr":1 + "score":0.2362873295 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-saba", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.6584629523, - "sentence_nr":1 + "score":0.3988160859 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.4743196503, - "sentence_nr":1 + "score":0.1351110513 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.6291489876, - "sentence_nr":1 + "score":0.3282404022 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.4333022325, - "sentence_nr":1 + "score":0.1135047432 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.556449953, - "sentence_nr":1 + "score":0.3702437183 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.1466607446, - "sentence_nr":1 + "score":0.2524012374 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.3655296382, - "sentence_nr":1 + "score":0.4786192289 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2052749403, - "sentence_nr":1 + "score":0.2105658138 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-saba", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4358647505, - "sentence_nr":1 + "score":0.4350780053 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"pa", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.3047577636, - "sentence_nr":1 + "score":0.3889163911 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"pa", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.483185127, - "sentence_nr":1 + "score":0.5826179394 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.2580795409, - "sentence_nr":1 + "score":0.3921555968 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.4391402666, - "sentence_nr":1 + "score":0.5536315548 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", + "task":"translation_from", "metric":"bleu", - "score":0.418078222, - "sentence_nr":1 + "score":0.2943696763 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", + "task":"translation_from", "metric":"chrf", - "score":0.5775458912, - "sentence_nr":1 + "score":0.5224446861 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.3475258894, - "sentence_nr":1 + "score":0.4674713564 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-saba", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.5729813197, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4610791065, - "sentence_nr":1 + "score":0.6782176965 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5982792042, - "sentence_nr":1 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ru", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.4642320267, - "sentence_nr":1 + "score":0.1704112037 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"ru", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.6555816107, - "sentence_nr":1 + "score":0.4377240493 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":1 + "score":0.2666948821 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-saba", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.0007348618, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2023879631, - "sentence_nr":1 + "score":0.4926215679 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-saba", "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5665467523, - "sentence_nr":1 + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"sw", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.4612469192, - "sentence_nr":1 + "score":0.07741038 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"sw", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.6895404842, - "sentence_nr":1 + "score":0.2658688973 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.4688149932, - "sentence_nr":1 + "score":0.1116660561 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.6935921005, - "sentence_nr":1 + "score":0.4225621416 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-saba", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.3190700151, - "sentence_nr":1 + "score":0.3226731558 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.6396787125, - "sentence_nr":1 + "score":0.4991511328 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.4257525491, - "sentence_nr":1 + "score":0.2633784516 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"mistralai\/mistral-saba", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6704469753, - "sentence_nr":1 + "score":0.4918671935 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.7017829861, - "sentence_nr":2 + "score":0.1788289199 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.7743327022, - "sentence_nr":2 + "score":0.4270187713 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.6961795372, - "sentence_nr":2 + "score":0.2622858638 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.7859480663, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5643442092, - "sentence_nr":2 + "score":0.4513610959 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7005543453, - "sentence_nr":2 + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.543231275, - "sentence_nr":2 + "score":0.1261643561 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.6677259865, - "sentence_nr":2 + "score":0.3351014303 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.7108042923, - "sentence_nr":2 + "score":0.2593001367 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"mistralai\/mistral-saba", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.8180084375, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1411835006, - "sentence_nr":2 + "score":0.5207002255 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-saba", "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2043183778, - "sentence_nr":2 + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"zh", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.1811004938, - "sentence_nr":2 + "score":0.2331909906 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"zh", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.2649993137, - "sentence_nr":2 + "score":0.4659908973 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.1408901109, - "sentence_nr":2 + "score":0.2401879449 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"mistralai\/mistral-saba", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.2194460381, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 + "score":0.2984854823 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1250181903, - "sentence_nr":2 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.2634990041, - "sentence_nr":2 + "score":0.1538277929 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", + "task":"translation_from", "metric":"chrf", - "score":0.3107963896, - "sentence_nr":2 + "score":0.4198691069 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.2072192435, - "sentence_nr":2 + "score":0.2808764056 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.3647593219, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1138660795, - "sentence_nr":2 + "score":0.4945291951 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3356458335, - "sentence_nr":2 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.1686235632, - "sentence_nr":2 + "score":0.1503587087 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.3637462812, - "sentence_nr":2 + "score":0.3519203949 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":2 + "score":0.1971487973 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.1485432117, - "sentence_nr":2 + "score":0.3802325565 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.2759460538, - "sentence_nr":2 + "score":0.2282524895 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.4266832189, - "sentence_nr":2 + "score":0.4762659907 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.464426437, - "sentence_nr":2 + "score":0.310849797 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.5519480629, - "sentence_nr":2 + "score":0.5162495445 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", + "task":"translation_from", "metric":"bleu", - "score":0.626894179, - "sentence_nr":2 + "score":0.3862933118 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", + "task":"translation_from", "metric":"chrf", - "score":0.6958291103, - "sentence_nr":2 + "score":0.5649666335 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.4554740717, - "sentence_nr":2 + "score":0.4654982999 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.549876635, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3581781081, - "sentence_nr":2 + "score":0.6658845521 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5012707041, - "sentence_nr":2 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"es", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.6297960259, - "sentence_nr":2 + "score":0.153039152 }, { - "model":"openai\/gpt-4.1-mini", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"es", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.7117676662, - "sentence_nr":2 + "score":0.3787678566 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.2283768002, - "sentence_nr":2 + "score":0.2956525612 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.4416418023, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4151474543, - "sentence_nr":2 + "score":0.5355759847 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6389524687, - "sentence_nr":2 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", + "task":"translation_from", "metric":"bleu", - "score":0.4355097603, - "sentence_nr":2 + "score":0.2366178299 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.6511365998, - "sentence_nr":2 + "score":0.496953378 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.2468185992, - "sentence_nr":2 + "score":0.4332629029 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.4679216763, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4295348441, - "sentence_nr":2 + "score":0.6444037956 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.623113134, - "sentence_nr":2 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.1163412939, - "sentence_nr":2 + "score":0.2794593031 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.315309023, - "sentence_nr":2 + "score":0.5163454129 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.195447958, - "sentence_nr":2 + "score":0.3170576155 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.3835451744, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.198893335, - "sentence_nr":2 + "score":0.5211214847 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3885583773, - "sentence_nr":2 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":2 + "score":0.1707579789 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.244801029, - "sentence_nr":2 + "score":0.4033109614 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1768354493, - "sentence_nr":2 + "score":0.2188248408 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.3684372572, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.359355104, - "sentence_nr":2 + "score":0.5492911343 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5589602235, - "sentence_nr":2 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.4267520229, - "sentence_nr":2 + "score":0.2285487924 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.5518115367, - "sentence_nr":2 + "score":0.471295757 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.4248870612, - "sentence_nr":2 + "score":0.3374389141 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5641041633, - "sentence_nr":2 + "score":0.454206736 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.4042942963, - "sentence_nr":2 + "score":0.1830822648 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.5757999868, - "sentence_nr":2 + "score":0.3748256188 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.4538153281, - "sentence_nr":2 + "score":0.156719726 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5943177067, - "sentence_nr":2 + "score":0.3565335339 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.3555103419, - "sentence_nr":2 + "score":0.1396612724 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.5627284646, - "sentence_nr":2 + "score":0.3788068496 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.5039752491, - "sentence_nr":2 + "score":0.1238899835 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.6136695013, - "sentence_nr":2 + "score":0.3481069187 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", + "task":"translation_from", "metric":"bleu", - "score":0.3693229588, - "sentence_nr":2 + "score":0.3486285299 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", + "task":"translation_from", "metric":"chrf", - "score":0.5524455185, - "sentence_nr":2 + "score":0.5488183895 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.0803311992, - "sentence_nr":2 + "score":0.3765245892 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.2302164129, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3284978808, - "sentence_nr":2 + "score":0.5298772939 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4983088157, - "sentence_nr":2 + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"pt", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.5088535943, - "sentence_nr":2 + "score":0.1859039826 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"pt", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.6252025968, - "sentence_nr":2 + "score":0.4364419603 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.5620488199, - "sentence_nr":2 + "score":0.3813303912 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"mistralai\/mistral-small-3.1-24b-instruct", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.7192054484, - "sentence_nr":2 + "score":0.5887135238 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", + "task":"translation_from", "metric":"bleu", - "score":0.5550041554, - "sentence_nr":2 + "score":0.1311303005 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", + "task":"translation_from", "metric":"chrf", - "score":0.6554946147, - "sentence_nr":2 + "score":0.3844997287 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.440689626, - "sentence_nr":2 + "score":0.2777412876 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.5713280637, - "sentence_nr":2 + "score":0.4986551548 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sw", + "task":"translation_from", "metric":"bleu", - "score":0.5530531361, - "sentence_nr":2 + "score":0.123417194 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sw", + "task":"translation_from", "metric":"chrf", - "score":0.756238556, - "sentence_nr":2 + "score":0.3074793247 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.3941975149, - "sentence_nr":2 + "score":0.1862273327 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.519104648, - "sentence_nr":2 + "score":0.4964265847 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.2626339401, - "sentence_nr":2 + "score":0.1871161773 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.4192320655, - "sentence_nr":2 + "score":0.3959828918 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.3850172427, - "sentence_nr":2 + "score":0.1541981122 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.5264633431, - "sentence_nr":2 + "score":0.3534389775 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":2 + "score":0.1380435832 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.1536323419, - "sentence_nr":2 + "score":0.3409229162 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.2697691813, - "sentence_nr":2 + "score":0.1042021716 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.4379048206, - "sentence_nr":2 + "score":0.3262262617 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.261816185, - "sentence_nr":2 + "score":0.1450000268 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.4694658943, - "sentence_nr":2 + "score":0.384195795 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.4395347892, - "sentence_nr":2 + "score":0.2211289124 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.6124294443, - "sentence_nr":2 + "score":0.4485571181 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":0.337115074, - "sentence_nr":2 + "score":0.1336281725 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":0.5683831732, - "sentence_nr":2 + "score":0.3849552359 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3222423456, - "sentence_nr":2 + "score":0.2484908362 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"mistralai\/mistral-small-3.1-24b-instruct", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.5643748238, - "sentence_nr":2 + "score":0.3028612614 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.3260557929, - "sentence_nr":2 + "score":0.1903586334 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ar", + "task":"translation_from", "metric":"chrf", - "score":0.5464327823, - "sentence_nr":2 + "score":0.446387516 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.1313941359, - "sentence_nr":2 + "score":0.2809263669 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.2490406851, - "sentence_nr":2 + "score":0.4646534423 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.3112317272, - "sentence_nr":2 + "score":0.1096890189 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.436159773, - "sentence_nr":2 + "score":0.3793955783 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.3671734945, - "sentence_nr":2 + "score":0.1159907317 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.493827516, - "sentence_nr":2 + "score":0.3788984673 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.3267949175, - "sentence_nr":2 + "score":0.2549144567 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.5061357552, - "sentence_nr":2 + "score":0.4826972193 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.3784649355, - "sentence_nr":2 + "score":0.34224065 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4712244356, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 + "score":0.5863783658 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9484564543, - "sentence_nr":3 + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"en", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.7505336183, - "sentence_nr":3 + "score":0.3883780582 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"en", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.8401910628, - "sentence_nr":3 + "score":0.5704308494 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 + "score":0.4668069531 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.92894163, - "sentence_nr":3 + "score":0.672145186 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"es", + "task":"translation_from", "metric":"bleu", - "score":0.4450050658, - "sentence_nr":3 + "score":0.184032222 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"es", + "task":"translation_from", "metric":"chrf", - "score":0.7558874882, - "sentence_nr":3 + "score":0.4351218193 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.8107492451, - "sentence_nr":3 + "score":0.3557841931 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.9000327478, - "sentence_nr":3 + "score":0.5719636086 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"fr", + "task":"translation_from", "metric":"bleu", - "score":0.1345392715, - "sentence_nr":3 + "score":0.1916132677 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.1052297427, - "sentence_nr":3 + "score":0.4640172061 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.2205549369, - "sentence_nr":3 + "score":0.4034048767 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.3931965049, - "sentence_nr":3 + "score":0.5890628474 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.1375527487, - "sentence_nr":3 + "score":0.3160468813 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.1039771531, - "sentence_nr":3 + "score":0.5380845065 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.1389994121, - "sentence_nr":3 + "score":0.3086022651 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.1094730342, - "sentence_nr":3 + "score":0.503357724 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.1372586106, - "sentence_nr":3 + "score":0.182638701 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.1114738485, - "sentence_nr":3 + "score":0.4629618645 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.6885326215, - "sentence_nr":3 + "score":0.26058128 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.8229812189, - "sentence_nr":3 + "score":0.5416150753 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.8395876231, - "sentence_nr":3 + "score":0.2482898345 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.9096086669, - "sentence_nr":3 + "score":0.4829019738 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.7267072831, - "sentence_nr":3 + "score":0.3097130959 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.8396959978, - "sentence_nr":3 + "score":0.4348908804 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.6374950652, - "sentence_nr":3 + "score":0.1939894603 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.6643984253, - "sentence_nr":3 + "score":0.366697572 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.7608566263, - "sentence_nr":3 + "score":0.2131488291 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.881580297, - "sentence_nr":3 + "score":0.4853868303 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.3480442076, - "sentence_nr":3 + "score":0.1138885419 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.6142483233, - "sentence_nr":3 + "score":0.3670742528 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2861853478, - "sentence_nr":3 + "score":0.1416518083 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.6401604433, - "sentence_nr":3 + "score":0.3217149096 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pa", + "task":"translation_from", "metric":"bleu", - "score":0.2861853478, - "sentence_nr":3 + "score":0.2942498706 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pa", + "task":"translation_from", "metric":"chrf", - "score":0.6401604433, - "sentence_nr":3 + "score":0.5514597671 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.2852636439, - "sentence_nr":3 + "score":0.3152534079 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.6732018003, - "sentence_nr":3 + "score":0.5017440919 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pt", + "task":"translation_from", "metric":"bleu", - "score":0.1840992999, - "sentence_nr":3 + "score":0.2158772583 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pt", + "task":"translation_from", "metric":"chrf", - "score":0.5294826056, - "sentence_nr":3 + "score":0.4780892551 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1740151771, - "sentence_nr":3 + "score":0.4052445466 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.450062616, - "sentence_nr":3 + "score":0.6186215895 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ru", + "task":"translation_from", "metric":"bleu", - "score":0.1512404438, - "sentence_nr":3 + "score":0.1501099752 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ru", + "task":"translation_from", "metric":"chrf", - "score":0.4224869588, - "sentence_nr":3 + "score":0.4157469966 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1512404438, - "sentence_nr":3 + "score":0.2685247919 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.4224869588, - "sentence_nr":3 + "score":0.4840654691 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"sw", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":3 + "score":0.1900353684 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"sw", + "task":"translation_from", "metric":"chrf", - "score":0.2686001166, - "sentence_nr":3 + "score":0.4405322363 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.1417229241, - "sentence_nr":3 + "score":0.2981157309 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.4762857001, - "sentence_nr":3 + "score":0.5535919581 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.2028736642, - "sentence_nr":3 + "score":0.1437549858 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.361485664, - "sentence_nr":3 + "score":0.3497530813 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.2255489037, - "sentence_nr":3 + "score":0.1088443126 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.395492575, - "sentence_nr":3 + "score":0.350662674 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"ur", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.2927057122, - "sentence_nr":3 + "score":0.1592716898 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"ur", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.4330945753, - "sentence_nr":3 + "score":0.4051863522 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.18038303, - "sentence_nr":3 + "score":0.1515473933 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-3.5-turbo", "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.320678468, - "sentence_nr":3 + "score":0.3710678709 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2721438001, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4053920466, - "sentence_nr":3 + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.2929807168, - "sentence_nr":3 + "score":0.1245150014 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.597559507, - "sentence_nr":3 + "score":0.3649923323 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.6689604664, - "sentence_nr":3 + "score":0.1931933918 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.8010329765, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6689604664, - "sentence_nr":3 + "score":0.397517622 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8010329765, - "sentence_nr":3 + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":0.149089608, - "sentence_nr":3 + "score":0.1633023298 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":0.4761746966, - "sentence_nr":3 + "score":0.4277663973 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3077874158, - "sentence_nr":3 + "score":0.2192873662 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-3.5-turbo", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.5260758147, - "sentence_nr":3 + "score":0.2909960698 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.4113125177, - "sentence_nr":3 + "score":0.1829429954 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ar", + "task":"translation_from", "metric":"chrf", - "score":0.4280807576, - "sentence_nr":3 + "score":0.4486992309 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3268514139, - "sentence_nr":3 + "score":0.3288082098 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.3758692874, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3734832063, - "sentence_nr":3 + "score":0.5189698121 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-3.5-turbo-0613", "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3839166952, - "sentence_nr":3 + "task":"mmlu", + "metric":"accuracy", + "score":0.4 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-3.5-turbo-0613", "bcp_47":"bn", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.3804672237, - "sentence_nr":3 + "score":0.0865856519 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-3.5-turbo-0613", "bcp_47":"bn", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.4337083419, - "sentence_nr":3 + "score":0.3670408519 }, { - "model":"openai\/gpt-4.1-mini", + "model":"openai\/gpt-3.5-turbo-0613", "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.4171995809, - "sentence_nr":3 + "score":0.1246701174 }, { - "model":"openai\/gpt-4.1-mini", + "model":"openai\/gpt-3.5-turbo-0613", "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.4623764371, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6237774736, - "sentence_nr":3 + "score":0.3844904766 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8500131525, - "sentence_nr":3 + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.5737647229, - "sentence_nr":3 + "score":0.255733121 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.8179798595, - "sentence_nr":3 + "score":0.4745347601 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.2320305803, - "sentence_nr":3 + "score":0.3450910905 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.6224956013, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2144945948, - "sentence_nr":3 + "score":0.593965846 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6528501353, - "sentence_nr":3 + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"en", + "task":"translation_from", "metric":"bleu", - "score":0.2244975801, - "sentence_nr":3 + "score":0.3751847049 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"en", + "task":"translation_from", "metric":"chrf", - "score":0.5326826664, - "sentence_nr":3 + "score":0.5546252024 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 + "score":0.4781043171 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 + "score":0.6714236508 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"es", + "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":3 + "score":0.1971959428 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"es", + "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":3 + "score":0.4525212046 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":3 + "score":0.3678222384 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 + "score":0.5884629819 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"fr", + "task":"translation_from", "metric":"bleu", - "score":0.201640652, - "sentence_nr":3 + "score":0.1903326188 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.392353398, - "sentence_nr":3 + "score":0.4492193992 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.4212555585, - "sentence_nr":3 + "score":0.3974812512 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.4426408937, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2750774388, - "sentence_nr":3 + "score":0.5872620046 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3471215691, - "sentence_nr":3 + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.3132288506, - "sentence_nr":3 + "score":0.3091104445 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.3821582739, - "sentence_nr":3 + "score":0.5239666365 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3286610737, - "sentence_nr":3 + "score":0.308658779 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.385722787, - "sentence_nr":3 + "score":0.4943494838 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.3471790743, - "sentence_nr":3 + "score":0.1558351322 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.5354826965, - "sentence_nr":3 + "score":0.4339633925 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1452867953, - "sentence_nr":3 + "score":0.2667443989 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4562626418, - "sentence_nr":3 + "score":0.5471646551 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.2114623992, - "sentence_nr":3 + "score":0.2512075408 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.3672220684, - "sentence_nr":3 + "score":0.4781485122 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.1136535202, - "sentence_nr":3 + "score":0.3294110726 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5427832684, - "sentence_nr":3 + "score":0.4419761829 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":3 + "score":0.1874700943 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.4062083693, - "sentence_nr":3 + "score":0.3668478037 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.2179816276 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":4 + "score":0.4537309029 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.1293703417 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":4 + "score":0.3740601424 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.1316417996 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":4 + "score":0.3104567715 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pa", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.223477129 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pa", + "task":"translation_from", "metric":"chrf", - "score":0.2246029758, - "sentence_nr":4 + "score":0.4562631144 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":4 + "score":0.2876949296 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":4 + "score":0.4857260461 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pt", + "task":"translation_from", "metric":"bleu", - "score":0.4765874091, - "sentence_nr":4 + "score":0.1820530207 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pt", + "task":"translation_from", "metric":"chrf", - "score":0.4591155777, - "sentence_nr":4 + "score":0.4181188719 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.4502212538, - "sentence_nr":4 + "score":0.417401324 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4687426738, - "sentence_nr":4 + "score":0.6189673269 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ru", + "task":"translation_from", "metric":"bleu", - "score":0.6350593429, - "sentence_nr":4 + "score":0.1434775736 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ru", + "task":"translation_from", "metric":"chrf", - "score":0.6022395695, - "sentence_nr":4 + "score":0.4131789962 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3407065042, - "sentence_nr":4 + "score":0.2902641383 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.3482814151, - "sentence_nr":4 + "score":0.5067661761 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"sw", + "task":"translation_from", "metric":"bleu", - "score":0.7215691881, - "sentence_nr":4 + "score":0.1838174977 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"sw", + "task":"translation_from", "metric":"chrf", - "score":0.7351007898, - "sentence_nr":4 + "score":0.446335194 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.2979831166 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.3013901676, - "sentence_nr":4 + "score":0.5546563707 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.1576206892 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.3810601296, - "sentence_nr":4 + "score":0.3790307912 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.1221954617 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.3518774507, - "sentence_nr":4 + "score":0.3360330123 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.1353612029 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.2850647115, - "sentence_nr":4 + "score":0.36632891 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.1357613569 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.3190905975, - "sentence_nr":4 + "score":0.3657578763 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 + "score":0.1119834897 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 + "score":0.3394106853 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.3809137042, - "sentence_nr":4 + "score":0.1986904894 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.5405504436, - "sentence_nr":4 + "score":0.3757062086 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 + "score":0.1621574248 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 + "score":0.4283684768 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3631474834, - "sentence_nr":4 + "score":0.2167142755 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-3.5-turbo-0613", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.5392658386, - "sentence_nr":4 + "score":0.2830134241 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2293530952, - "sentence_nr":4 + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4689601315, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", "bcp_47":"ar", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.2294068721, - "sentence_nr":4 + "score":0.2353582779 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ar", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.4045836405, - "sentence_nr":4 + "score":0.5006899773 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.3664710407 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.3258864375, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 + "score":0.5606190587 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3200317028, - "sentence_nr":4 + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.2308824748, - "sentence_nr":4 + "score":0.2553082196 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.4093450186, - "sentence_nr":4 + "score":0.488512704 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.232779904, - "sentence_nr":4 + "score":0.2688722519 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.4150815685, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4523791233, - "sentence_nr":4 + "score":0.4454248715 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6299071574, - "sentence_nr":4 + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.2373681044, - "sentence_nr":4 + "score":0.2566663279 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.4004852416, - "sentence_nr":4 + "score":0.5174970249 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.2916261379, - "sentence_nr":4 + "score":0.4322161955 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4106520927, - "sentence_nr":4 + "score":0.6526227117 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", + "task":"translation_from", "metric":"bleu", - "score":0.2827647331, - "sentence_nr":4 + "score":0.4934809373 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"en", + "task":"translation_from", "metric":"chrf", - "score":0.3743678965, - "sentence_nr":4 + "score":0.6722291033 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.1100868155, - "sentence_nr":4 + "score":0.6327969379 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.297203493, - "sentence_nr":4 + "score":0.8005146414 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", + "task":"translation_from", "metric":"bleu", - "score":0.5605065819, - "sentence_nr":4 + "score":0.235589316 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", + "task":"translation_from", "metric":"chrf", - "score":0.5868532678, - "sentence_nr":4 + "score":0.5063165811 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3630029634, - "sentence_nr":4 + "score":0.3911713119 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.5816676674, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.352539976, - "sentence_nr":4 + "score":0.6242017348 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.579811697, - "sentence_nr":4 + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"fr", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.3927053213, - "sentence_nr":4 + "score":0.311885366 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"fr", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.5108598155, - "sentence_nr":4 + "score":0.5786679545 }, { "model":"openai\/gpt-4.1-mini", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5369357392, - "sentence_nr":4 + "score":0.5123128835 }, { "model":"openai\/gpt-4.1-mini", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.5869601651, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2876540853, - "sentence_nr":4 + "score":0.6920494347 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4046608868, - "sentence_nr":4 + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.1819722649, - "sentence_nr":4 + "score":0.3452221913 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.4425473022, - "sentence_nr":4 + "score":0.5902403977 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.2529183169, - "sentence_nr":4 + "score":0.381895318 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.4482360279, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2796002691, - "sentence_nr":4 + "score":0.5898272046 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4817204985, - "sentence_nr":4 + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.1708721495, - "sentence_nr":4 + "score":0.2855978621 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.3646964804, - "sentence_nr":4 + "score":0.5472063766 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1330519954, - "sentence_nr":4 + "score":0.3721127194 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4324498727, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3377385621, - "sentence_nr":4 + "score":0.6463029364 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.525612845, - "sentence_nr":4 + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.4477604756, - "sentence_nr":4 + "score":0.288264373 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.5801193948, - "sentence_nr":4 + "score":0.5359086837 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.287558382, - "sentence_nr":4 + "score":0.3670619927 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.6087635831, - "sentence_nr":4 + "score":0.5068433812 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.3569375456, - "sentence_nr":4 + "score":0.3051034461 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.5492415189, - "sentence_nr":4 + "score":0.5471092112 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.1254691277, - "sentence_nr":4 + "score":0.2747623728 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.2651343524, - "sentence_nr":4 + "score":0.5861307631 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.1240721616, - "sentence_nr":4 + "score":0.2464469919 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.2664864612, - "sentence_nr":4 + "score":0.4954666446 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.1126159789, - "sentence_nr":4 + "score":0.2249035276 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.2523482734, - "sentence_nr":4 + "score":0.4254292104 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"pa", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.1275785595, - "sentence_nr":4 + "score":0.4045917852 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"pa", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.3385577202, - "sentence_nr":4 + "score":0.6244183732 }, { "model":"openai\/gpt-4.1-mini", "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.0841173493, - "sentence_nr":4 + "score":0.4219453949 }, { "model":"openai\/gpt-4.1-mini", "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.2901271494, - "sentence_nr":4 + "score":0.5730380868 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", + "task":"translation_from", "metric":"bleu", - "score":0.5322520826, - "sentence_nr":4 + "score":0.2852961117 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", + "task":"translation_from", "metric":"chrf", - "score":0.7271316675, - "sentence_nr":4 + "score":0.5549713299 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.5266403878, - "sentence_nr":4 + "score":0.4724645835 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6838125749, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 + "score":0.6736886701 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6871514991, - "sentence_nr":4 + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ru", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 + "score":0.2092871331 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"ru", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.699912443, - "sentence_nr":4 + "score":0.4879651984 }, { "model":"openai\/gpt-4.1-mini", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.5322520826, - "sentence_nr":4 + "score":0.4104606671 }, { "model":"openai\/gpt-4.1-mini", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.7271316675, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2092659579, - "sentence_nr":4 + "score":0.6062298906 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.535476676, - "sentence_nr":4 + "task":"mmlu", + "metric":"accuracy", + "score":0.5 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.1284866897, - "sentence_nr":4 + "score":0.2119039225 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.5495968221, - "sentence_nr":4 + "score":0.4718779729 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.3099627272, - "sentence_nr":4 + "score":0.3482867389 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-4.1-mini", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.5376391724, - "sentence_nr":4 + "score":0.6083272302 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.1574248334, - "sentence_nr":4 + "score":0.292187148 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.4351951744, - "sentence_nr":4 + "score":0.5292968897 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.5074919773, - "sentence_nr":4 + "score":0.2456913217 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6528956125, - "sentence_nr":4 + "score":0.4548022965 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.2887138087, - "sentence_nr":5 + "score":0.2215148184 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.6342291346, - "sentence_nr":5 + "score":0.4881854895 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":5 + "score":0.2641606665 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":5 + "score":0.4480825493 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.7013062757, - "sentence_nr":5 + "score":0.2163224434 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.9303769449, - "sentence_nr":5 + "score":0.4949463826 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.3086902722 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4.1-mini", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.23816585, - "sentence_nr":5 + "score":0.5554756761 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4.1-mini", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":1.0, - "sentence_nr":5 + "score":0.207708073 }, { "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":1.0, - "sentence_nr":5 + "score":0.4816364739 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-4.1-mini", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3758990206, - "sentence_nr":5 + "score":0.2818179571 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-4.1-mini", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.4255415128, - "sentence_nr":5 + "score":0.3369663048 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 + "score":0.2325698513 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", + "task":"translation_from", "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 + "score":0.4900910318 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.1927292346, - "sentence_nr":5 + "score":0.3273886017 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.3145892043, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 + "score":0.5507594814 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.4298810543, - "sentence_nr":5 + "score":0.1825189442 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.7577244658, - "sentence_nr":5 + "score":0.4341218556 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.5366411242, - "sentence_nr":5 + "score":0.2624070312 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.8255664943, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6179396438, - "sentence_nr":5 + "score":0.4731044972 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.866516296, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.4360038791, - "sentence_nr":5 + "score":0.2633872752 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.7669087485, - "sentence_nr":5 + "score":0.5250805862 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.4563369808, - "sentence_nr":5 + "score":0.3914347425 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.787353904, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4165530721, - "sentence_nr":5 + "score":0.6094934561 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.702780513, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", + "task":"translation_from", "metric":"bleu", - "score":0.4027788022, - "sentence_nr":5 + "score":0.4631079117 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", + "task":"translation_from", "metric":"chrf", - "score":0.6872835607, - "sentence_nr":5 + "score":0.6442114257 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.4024582794, - "sentence_nr":5 + "score":0.5299774376 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.6664090182, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.7380736765 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4.1-nano", "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5552412315, - "sentence_nr":5 + "task":"mmlu", + "metric":"accuracy", + "score":0.4 }, { - "model":"openai\/gpt-4.1-mini", + "model":"openai\/gpt-4.1-nano", "bcp_47":"es", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.6976333496, - "sentence_nr":5 + "score":0.2274715114 }, { - "model":"openai\/gpt-4.1-mini", + "model":"openai\/gpt-4.1-nano", "bcp_47":"es", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.8331572108, - "sentence_nr":5 + "score":0.4837759577 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.4130732371, - "sentence_nr":5 + "score":0.3124440889 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.5785653392, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5248587176, - "sentence_nr":5 + "score":0.5261084633 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6664855309, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", + "task":"translation_from", "metric":"bleu", - "score":0.5248587176, - "sentence_nr":5 + "score":0.2312533162 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.6664855309, - "sentence_nr":5 + "score":0.4815491459 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.3279713812, - "sentence_nr":5 + "score":0.455086296 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.4864562825, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4987046236, - "sentence_nr":5 + "score":0.6474755177 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.647874639, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", + "task":"translation_from", "metric":"bleu", - "score":0.1772984226, - "sentence_nr":5 + "score":0.2652800435 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", + "task":"translation_from", "metric":"chrf", - "score":0.4103582048, - "sentence_nr":5 + "score":0.5175523714 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3489583637, - "sentence_nr":5 + "score":0.3386268714 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.4767378359, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4010889715, - "sentence_nr":5 + "score":0.5633372903 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5642546048, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.3014528044, - "sentence_nr":5 + "score":0.1907857214 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.472975393, - "sentence_nr":5 + "score":0.4650956372 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.2199206296, - "sentence_nr":5 + "score":0.3541709408 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4070442354, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 + "score":0.6291579219 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.8958039312, - "sentence_nr":5 + "score":0.1469461673 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.9382091007, - "sentence_nr":5 + "score":0.4392693708 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.6433799262, - "sentence_nr":5 + "score":0.2078261662 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.8103769737, - "sentence_nr":5 + "score":0.3748504876 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.5403356451, - "sentence_nr":5 + "score":0.2484943284 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.7639130574, - "sentence_nr":5 + "score":0.4654993953 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":5 + "score":0.2497434284 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":5 + "score":0.5490071169 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.4500531895, - "sentence_nr":5 + "score":0.1625330023 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.4302706554, - "sentence_nr":5 + "score":0.4495751195 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.4933292241, - "sentence_nr":5 + "score":0.2157605321 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.5225247298, - "sentence_nr":5 + "score":0.456208027 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", + "task":"translation_from", "metric":"bleu", - "score":0.234878114, - "sentence_nr":5 + "score":0.3790606838 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", + "task":"translation_from", "metric":"chrf", - "score":0.4062284747, - "sentence_nr":5 + "score":0.6045377359 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.3763743474, - "sentence_nr":5 + "score":0.3874235881 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.4017565065, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5135063581, - "sentence_nr":5 + "score":0.5593657469 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5263652477, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-4.1-nano", "bcp_47":"pt", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.2760123498 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-4.1-nano", "bcp_47":"pt", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.5212982931, - "sentence_nr":5 + "score":0.5134357242 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4.1-nano", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.3531901509, - "sentence_nr":5 + "score":0.416752628 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4.1-nano", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.5822934956, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3531901509, - "sentence_nr":5 + "score":0.6215563908 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5822934956, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.1853930017 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", + "task":"translation_from", "metric":"chrf", - "score":0.5095895502, - "sentence_nr":5 + "score":0.465375097 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3532802306, - "sentence_nr":5 + "score":0.2860173151 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.5839265502, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3855522726, - "sentence_nr":5 + "score":0.5480059055 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5872605669, - "sentence_nr":5 + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", + "task":"translation_from", "metric":"bleu", - "score":0.4426623527, - "sentence_nr":5 + "score":0.2010282492 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", + "task":"translation_from", "metric":"chrf", - "score":0.636837103, - "sentence_nr":5 + "score":0.4493062791 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.366634099, - "sentence_nr":5 + "score":0.2458134572 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.5782960279, - "sentence_nr":5 + "score":0.5476246368 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.3289267652, - "sentence_nr":5 + "score":0.2087672996 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.580076131, - "sentence_nr":5 + "score":0.4716980224 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.4655035539, - "sentence_nr":5 + "score":0.1943752237 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6467306329, - "sentence_nr":5 + "score":0.4205022979 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.1965085477, - "sentence_nr":5 + "score":0.1759186135 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.5134302168, - "sentence_nr":5 + "score":0.4432474082 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.242532014 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.5187615227, - "sentence_nr":5 + "score":0.4305022436 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.1547443459 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.5205634208, - "sentence_nr":5 + "score":0.4483479472 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.2971306268 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.5187615227, - "sentence_nr":5 + "score":0.5596664411 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4.1-nano", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.1404632343 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":0.5287371836, - "sentence_nr":5 + "score":0.4382880735 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.5106109398, - "sentence_nr":5 + "score":0.2230925442 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", + "model":"openai\/gpt-4.1-nano", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.7688046995, - "sentence_nr":5 + "score":0.3010591018 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", + "task":"translation_from", "metric":"bleu", - "score":0.4477845944, - "sentence_nr":5 + "score":0.2260572099 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", + "task":"translation_from", "metric":"chrf", - "score":0.7043336945, - "sentence_nr":5 + "score":0.5164260772 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.3221411249, - "sentence_nr":5 + "score":0.3098248698 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.7794716829, - "sentence_nr":5 + "score":0.536672296 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":5 + "score":0.1851732693 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", + "task":"translation_from", "metric":"chrf", - "score":0.556499296, - "sentence_nr":5 + "score":0.4399312653 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.5129586382, - "sentence_nr":5 + "score":0.305694311 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", + "model":"openai\/gpt-4o-mini", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.7857394056, - "sentence_nr":5 + "score":0.4860162598 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", + "task":"translation_from", "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 + "score":0.2442519451 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", + "task":"translation_from", "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 + "score":0.5003799076 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":1.0, - "sentence_nr":6 + "score":0.3647222325 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", + "model":"openai\/gpt-4o-mini", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 + "score":0.6024672844 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-4o-mini", "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 + "task":"mmlu", + "metric":"accuracy", + "score":0.7 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4o-mini", "bcp_47":"en", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":6 + "score":0.4797368411 }, { - "model":"meta-llama\/llama-3-70b-instruct", + "model":"openai\/gpt-4o-mini", "bcp_47":"en", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.3263040637, - "sentence_nr":6 + "score":0.6374317341 }, { - "model":"openai\/gpt-4.1-mini", + "model":"openai\/gpt-4o-mini", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 + "score":0.6311582936 }, { - "model":"openai\/gpt-4.1-mini", + "model":"openai\/gpt-4o-mini", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5561195823, - "sentence_nr":6 + "score":0.7997371179 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5362935676, - "sentence_nr":6 + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", + "task":"translation_from", "metric":"bleu", - "score":0.5803515898, - "sentence_nr":6 + "score":0.2600341328 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", + "task":"translation_from", "metric":"chrf", - "score":0.5422220469, - "sentence_nr":6 + "score":0.4963209525 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.4204739941, - "sentence_nr":6 + "score":0.417992948 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.5173824079, - "sentence_nr":6 + "score":0.640138245 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", + "task":"translation_from", "metric":"bleu", - "score":0.4177866849, - "sentence_nr":6 + "score":0.2376904256 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", + "task":"translation_from", "metric":"chrf", - "score":0.5243375045, - "sentence_nr":6 + "score":0.5011085853 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.4593860924, - "sentence_nr":6 + "score":0.4849594812 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", + "model":"openai\/gpt-4o-mini", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.5045746405, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3343829907, - "sentence_nr":6 + "score":0.6766251104 }, { - "model":"meta-llama\/llama-4-maverick", + "model":"openai\/gpt-4o-mini", "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5409759573, - "sentence_nr":6 + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4o-mini", "bcp_47":"hi", - "task":"translation_to", + "task":"translation_from", "metric":"bleu", - "score":0.3785406892, - "sentence_nr":6 + "score":0.3234457974 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", + "model":"openai\/gpt-4o-mini", "bcp_47":"hi", - "task":"translation_to", + "task":"translation_from", "metric":"chrf", - "score":0.5743796566, - "sentence_nr":6 + "score":0.5370126468 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-4o-mini", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3785406892, - "sentence_nr":6 + "score":0.3996080448 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", + "model":"openai\/gpt-4o-mini", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.5768306472, - "sentence_nr":6 + "score":0.6023656967 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", + "task":"translation_from", "metric":"bleu", - "score":0.3213450436, - "sentence_nr":6 + "score":0.2125374969 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", + "task":"translation_from", "metric":"chrf", - "score":0.5076725974, - "sentence_nr":6 + "score":0.5022908944 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.3075951598, - "sentence_nr":6 + "score":0.2960726977 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", + "model":"openai\/gpt-4o-mini", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4988668236, - "sentence_nr":6 + "score":0.5881822388 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ja", + "task":"translation_from", "metric":"bleu", - "score":0.4550680331, - "sentence_nr":6 + "score":0.281578672 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ja", + "task":"translation_from", "metric":"chrf", - "score":0.6477506541, - "sentence_nr":6 + "score":0.4963026763 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.5923136157, - "sentence_nr":6 + "score":0.3509105353 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.7382416556, - "sentence_nr":6 + "score":0.4772595136 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"jv", + "task":"translation_from", "metric":"bleu", - "score":0.5923136157, - "sentence_nr":6 + "score":0.244859193 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"jv", + "task":"translation_from", "metric":"chrf", - "score":0.7568286018, - "sentence_nr":6 + "score":0.4719413896 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4o-mini", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 + "score":0.2375487692 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", + "model":"openai\/gpt-4o-mini", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 + "score":0.5454443303 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"mr", + "task":"translation_from", "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 + "score":0.2071473102 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"mr", + "task":"translation_from", "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 + "score":0.4103819252 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"openai\/gpt-4o-mini", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.4018202851, - "sentence_nr":6 + "score":0.2256200492 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", + "model":"openai\/gpt-4o-mini", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.6003256952, - "sentence_nr":6 + "score":0.4419952711 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pa", + "task":"translation_from", "metric":"bleu", - "score":0.5804511284, - "sentence_nr":6 + "score":0.3531564234 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pa", + "task":"translation_from", "metric":"chrf", - "score":0.7542976177, - "sentence_nr":6 + "score":0.5805142329 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.4018202851, - "sentence_nr":6 + "score":0.3707122189 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.6003256952, - "sentence_nr":6 + "score":0.5524474478 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"pt", + "task":"translation_from", "metric":"bleu", - "score":0.0, - "sentence_nr":6 + "score":0.2673214525 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pt", + "task":"translation_from", "metric":"chrf", - "score":0.5263574469, - "sentence_nr":6 + "score":0.5155609027 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.5582486914, - "sentence_nr":6 + "score":0.440844237 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", + "model":"openai\/gpt-4o-mini", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6678493404, - "sentence_nr":6 + "score":0.6696954647 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"ru", + "task":"translation_from", "metric":"bleu", - "score":0.3771745743, - "sentence_nr":6 + "score":0.2144471986 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ru", + "task":"translation_from", "metric":"chrf", - "score":0.5554130492, - "sentence_nr":6 + "score":0.4935159532 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.0, - "sentence_nr":6 + "score":0.3268453207 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.3159892348, - "sentence_nr":6 + "score":0.5715958119 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"sw", + "task":"translation_from", "metric":"bleu", - "score":0.1895316299, - "sentence_nr":6 + "score":0.2086488438 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"sw", + "task":"translation_from", "metric":"chrf", - "score":0.4587674595, - "sentence_nr":6 + "score":0.4503413027 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.2383770505, - "sentence_nr":6 + "score":0.3062254829 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", + "model":"openai\/gpt-4o-mini", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.4666458696, - "sentence_nr":6 + "score":0.585118766 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"te", + "task":"translation_from", "metric":"bleu", - "score":0.2556795749, - "sentence_nr":6 + "score":0.2751005462 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"te", + "task":"translation_from", "metric":"chrf", - "score":0.4561555898, - "sentence_nr":6 + "score":0.4938464228 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.7629273293, - "sentence_nr":6 + "score":0.200746746 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.8510385545, - "sentence_nr":6 + "score":0.4753275787 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ur", + "task":"translation_from", "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 + "score":0.2271037726 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ur", + "task":"translation_from", "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 + "score":0.4884796205 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 + "score":0.2821385341 }, { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.9094153226, - "sentence_nr":6 + "score":0.4794553557 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"vi", + "task":"translation_from", "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 + "score":0.2177425012 }, { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"vi", + "task":"translation_from", "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 + "score":0.4737357708 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.6425503167, - "sentence_nr":6 + "score":0.2936126961 }, { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", + "model":"openai\/gpt-4o-mini", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.807889193, - "sentence_nr":6 + "score":0.5463661979 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"openai\/gpt-4o-mini", + "bcp_47":"zh", + "task":"translation_from", "metric":"bleu", - "score":0.4934916371, - "sentence_nr":6 + "score":0.1648676261 }, { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", + "model":"openai\/gpt-4o-mini", + "bcp_47":"zh", + "task":"translation_from", "metric":"chrf", - "score":0.694445271, - "sentence_nr":6 + "score":0.4464998109 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", + "model":"openai\/gpt-4o-mini", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.303764309, - "sentence_nr":6 + "score":0.2613931597 }, { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5183662698, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1837671115, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3981272326, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3409605607, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5217663813, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2989898445, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5359750729, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.8253498773, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8529564805, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7944837206, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.878453174, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7944837206, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.878453174, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6941268298, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7679844671, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5828833474, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.7908226509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3869431776, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5953878513, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2620499196, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4893724002, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2212877653, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4999323991, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4272870064, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6271734609, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5040673596, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6469962279, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2281684904, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4984990869, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5106109398, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6635467153, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.325909498, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5501364765, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.7498810286, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7726337965, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3954948172, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4821021676, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5029543425, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2254310841, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5721164466, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4884391792, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7050595168, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4902350231, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7638414724, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4424906783, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7055079713, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4145278784, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6973605664, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4103230277, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6634154487, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6380575768, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.824567364, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0786010539, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0967837769, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1160114131, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2167118757, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2390076355, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3357015413, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1371661844, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2345567914, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1809155303, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3604670694, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3501522472, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5701648579, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3349252033, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5908087432, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3258812298, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5753985305, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2883113323, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5835478395, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2347500093, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5032853946, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.344905813, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.536561983, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2968884568, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5494319015, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3257602417, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.566659654, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2251114029, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5538390232, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3029863251, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5652374403, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2537603225, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5334329404, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2003914161, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3612331209, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0564437248, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1502603746, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4303467795, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3275231027, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6168686838, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3270769537, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5166643607, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3069937936, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5024648106, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3575909322, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5409483829, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2228729825, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4466759653, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2662960357, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5253549609, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3927237742, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7451438087, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5570357635, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8116469942, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3508597297, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6833592152, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2125947044, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5863866794, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.443404947, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7587103444, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3826576187, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6071841372, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3447241448, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5531085141, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3178743908, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5513949312, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1883251048, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4530322538, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0192989769, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3112863571, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6304411194, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1330856181, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5312476702, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.257912492, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5545120254, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1595487508, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4511156609, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5928508276, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2879556779, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4554184077, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0957892195, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4047288792, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2296566982, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4624781939, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0892095247, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.322418757, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0659828829, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3008263307, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3872951671, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6571482446, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3299562825, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5982616321, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4381454708, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.616374622, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3614922712, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5698489013, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3957463069, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6093311945, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3665528144, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5966563048, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.258729775, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5132023402, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2914897523, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5714769597, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1115093771, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4170915413, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1206120707, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4663892484, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3480079866, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6148736551, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.312222584, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5549937871, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2706573913, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5619563044, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2133109831, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4766025973, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1985082374, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5129122522, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2368307518, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2631328191, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1645539243, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1367388582, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0528214025, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1072112607, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4615978016, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6280777654, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.422429895, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6082308552, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3045125886, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4983778741, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3676904072, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4064141882, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3472289737, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4103553163, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4155938131, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.328671194, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5944310795, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1354727734, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.483018962, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2297009209, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5537467827, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1354727734, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4685134393, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3498215109, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5324168516, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3874773379, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3174769726, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4079777866, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3818556455, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3785761837, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3818556455, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4693593336, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7730555735, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4336894555, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6409951781, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3681829215, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6273930299, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4389321784, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6468470369, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4336894555, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6805799636, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.316021361, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.516561467, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.307587447, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4684197705, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3716923706, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5383668332, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1865526716, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3640275544, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1420081588, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3704326476, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2961516536, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4980392435, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3459667619, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6170810606, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2362379063, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5441149449, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3593699487, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6492026441, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2989025113, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6058743572, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4683276331, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.8176110135, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9436043262, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.988019168, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0067104199, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4593546098, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6086021462, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2338678621, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.466629299, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1634124231, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4007254932, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1395211838, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4030284875, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3419664739, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4989057927, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3397180517, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6494995649, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2381198934, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4812080785, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2316879948, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.525267212, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2889285495, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4536746865, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4136211902, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6393493535, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6031612036, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7362867034, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3943234482, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5943452555, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3443768664, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6090402109, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3920558089, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6772940234, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4263005629, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6665768162, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1125439789, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2062328899, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1100081929, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1896706167, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1077233201, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2360903687, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1498435849, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2105170009, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1148374893, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2218739144, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2449339028, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4811362511, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1947668131, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4203040773, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3360050269, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5162346122, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1033604925, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3088863285, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2176929795, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.454042834, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3459789902, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5620330456, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3782571349, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5584414289, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.369537503, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5568751295, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4792316814, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6534660189, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4200122603, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6060665796, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1845747513, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4437997152, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1821246362, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4695925404, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.20734617, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5036833881, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2817686971, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5170853674, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2701727285, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5162766223, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2517176763, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.451373445, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3128384317, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4801627921, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3508847644, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5291980445, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2674628639, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.478429215, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2643715067, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4590454051, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4320063812, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6892273788, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3411951585, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6539473951, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4737246708, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7348004695, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5582838438, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7625459507, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5641401219, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7505430817, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4047570083, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4349871721, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4749702454, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3805666011, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4158948448, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5244380104, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6914581279, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4472834999, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.645713027, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4034697489, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5836273992, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.452120997, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6307076431, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5201565256, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6663170491, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5041542875, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6074467585, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1877181603, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.375941608, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2828480467, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4330386622, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2631417381, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4194315681, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3180687408, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4375097637, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3368441656, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6173496967, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2105458851, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5020237474, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2108312271, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4950405689, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2259358117, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4781181087, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3653727003, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6006612018, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.112836786, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5027560731, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2943290953, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5637465581, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2066516314, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5424961082, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3720123244, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.185863022, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5550584876, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5592169701, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7187320759, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4438455476, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6320800719, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5894973559, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7562097957, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3846086977, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5835344719, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4440401202, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.634367012, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3742128962, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5924994298, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3206397177, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5206258402, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.390861271, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6239956806, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3020679768, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5246291817, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3629639414, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5313865724, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.8780634321, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9269467001, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.7964573358, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8458636472, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9452996323, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9463396364, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.8781548422, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9156314785, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3240643366, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5243586267, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3463367232, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5378805625, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3852076286, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.562982276, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2602101451, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4820043661, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3207234978, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4977201244, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4318843329, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6011096109, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3582301851, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5380305838, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4417559394, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6111096353, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3905612193, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5861956607, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4354870568, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6005516255, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4641883722, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.640326715, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3007405773, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5272774705, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.40610665, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6080346531, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3152039044, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.566675397, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4045482503, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5951482608, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4422044706, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6089032707, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3099603853, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5209233177, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3093921662, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5208328629, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2417404985, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4540589962, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3443388178, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5341360898, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4331131004, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5898969623, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3558039927, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5392592206, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4072470239, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5650294312, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3741026208, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5834523244, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3938763752, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5909459754, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5274220384, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.676558814, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3931738146, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6026058741, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3229030612, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5136703373, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3113772787, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5344680037, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4015176111, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5570033942, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.427346675, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6397906518, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4893093641, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6990856292, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4951704011, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6726500193, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.474262745, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6547171932, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.5534262126, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7517262393, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3692194586, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5602656573, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3963410286, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6131661903, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3905898585, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5498108215, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3343350399, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5465517654, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4509623706, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6276175882, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4404175157, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.649940095, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4429424771, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5915660675, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.418987297, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5748791698, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.202098372, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4110516731, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2970536843, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5186257966, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0740715445, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4314543453, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1290369606, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.456225988, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0244593913, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1235182482, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4682275447, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1622106093, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5093553102, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.066471681, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3435083262, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1256067288, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.496956026, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1707705852, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5022008375, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1078475606, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4427230465, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0797339583, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4418411387, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0973598172, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3528893466, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0827317824, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3639966646, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1301287033, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.385283552, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3356633416, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0965691457, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3802997171, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1156401289, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4459978368, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1260148278, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4359566525, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.120222864, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4827998681, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1535037749, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4764514844, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.432913173, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2521233582, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4095908744, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6348509381, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4095908744, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6348509381, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3182970444, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.595316257, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2154426819, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5620944561, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0867932999, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4201964133, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0821410657, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3969463878, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1897299381, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5086851538, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3833939462, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0829682579, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.384929236, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3630576976, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0744904632, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4111163206, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.43631303, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4174727607, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4278386149, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0861671109, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3696512763, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1289410403, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4486368935, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0882525219, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4377853722, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0534513757, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3829169125, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4024696873, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1538602933, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4391148259, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1007092756, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4371822026, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1147846313, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4651957502, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0713710158, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4075406301, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0846581996, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4509865769, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.1946966569, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0772718393, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4203683137, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0829135716, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4009694997, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3714280467, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0889905327, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4022940284, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0612660422, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3837677428, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0756907194, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4138725094, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0886663742, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4487646223, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1057442843, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.453718146, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4393340573, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1195053738, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.451213629, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2174835365, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4462746463, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2444399937, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4991016393, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3415556284, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0889084344, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3974812246, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3961285597, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6148751441, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.49237513, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.685375649, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3996712648, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6353525756, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5115346945, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7037574716, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5396134765, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7656669576, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1737495157, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4532559788, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1774329946, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.430712719, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1605265407, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4158012087, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0596357961, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3113976238, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1688287853, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4916588179, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2680102298, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5654883865, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2166540719, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4344921443, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2735429727, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5644723204, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2022332245, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5084057058, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.278351925, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5348467461, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3574583793, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.592411512, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3799465256, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6464467277, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.420650773, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6788513036, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3536718074, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6344846207, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4583059141, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6572591476, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2229272631, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5653789748, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0936226112, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3452056942, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2693093705, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5410704186, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2463476586, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5596851385, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.266398619, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5645550913, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2140322213, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5631214322, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1891762066, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4346170233, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.185053788, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4705108742, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0980716713, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4646043403, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1724657814, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4978075401, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4054983797, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6264774231, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4204505079, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6503146347, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4387071211, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6525926696, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.420744549, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6496192656, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4877513773, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7197897787, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2005111976, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5334791309, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2489407298, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5212235893, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2372464203, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5175129869, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.184941941, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5067677917, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3189223091, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5875084576, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.353500237, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5959879218, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3936136052, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6492198448, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3936136052, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6492198448, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3833310864, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6252821653, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3938668169, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6503960274, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3598376609, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5862251405, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2114773474, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4102017865, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3563982586, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5378970485, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1510722413, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4359232973, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3276244253, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5817308767, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2971752224, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6051336645, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2329856852, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5405751251, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2563564295, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5499025329, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2500653935, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5098952452, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3410035629, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6673519559, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2786312784, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4836796408, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4175668624, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5616829346, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4205004826, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5674537639, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4097432382, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5368112087, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.380217695, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5452668935, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7281051247, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7882997401, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5806197937, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7346706701, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5793367581, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6502428442, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4855332614, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5299556743, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5411953361, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6689891795, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2555219912, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3799133205, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2338678621, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3682311524, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1173952179, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2209049178, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1892240569, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2804131085, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0996020674, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2144517459, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4093301993, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5127625182, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6244631487, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6931369519, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5819726385, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6970914529, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4412006373, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5296624609, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5411953361, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6689891795, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4577275269, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6747054474, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2538333923, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4589637948, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3508739524, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5533976154, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2370526644, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4471600746, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3315041466, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5307991157, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2766873691, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4414406761, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1720076757, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3723150838, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2465659486, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.568906916, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3039115378, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1548157555, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3242496688, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4751132439, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6159319815, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1477219991, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.286852017, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1477219991, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2391308149, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1818060822, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2730775333, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1496597508, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2221350278, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.7281051247, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7847983366, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3254455687, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4474512036, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3267294026, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4510525483, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4855332614, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6448214025, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4815092082, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5820265218, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2388752792, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4120359949, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.36210097, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4080981511, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.316501463, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4251617362, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3692377875, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5093945383, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7246473808, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7282086346, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5793367581, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6502428442, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1243018504, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3295011624, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5198707242, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6498183531, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4732072478, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5833006007, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3556521384, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5948308114, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.5406964704, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.596459533, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2575863752, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3717184744, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1358581334, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3021348975, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0893927012, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2952752522, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.216291148, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3542320138, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2199335663, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3822901361, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1221286555, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.276049295, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1580460695, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2486403592, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2246029758, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5581982021, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4379538199, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5881561249, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4667095722, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3754432474, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5293274846, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4121323135, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4043598708, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3425668387, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4147702817, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4043598708, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.396188029, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3985861327, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3818534927, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.364411248, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3898236605, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5042211795, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5582360999, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5516607623, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4716061611, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5256353513, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3765697091, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2534743707, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5971149415, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4576529536, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5309982647, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4726395749, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4005242819, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4214137028, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2460137258, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6374693501, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1892240569, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6151179643, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2460137258, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6869474337, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4746119151, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5833743057, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4642659596, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4123810027, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4123810027, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4806367958, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4326969206, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4108469458, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3990998963, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3991370902, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4044335714, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3990998963, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3113878808, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6758978745, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1718152967, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5293474686, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2357831604, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5821373704, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1452867953, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5149523169, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2289415686, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6314372537, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2887138087, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6342291346, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7013062757, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9303769449, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.23816585, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.508747354, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7647955332, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.508747354, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7647955332, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.508747354, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7647955332, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.5738396575, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7983571334, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6626129614, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8597893118, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4027672046, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6529271691, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5379348325, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.770376611, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3018835387, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6086565368, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2239152297, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6087618281, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.6026286935, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8025775976, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.6626129614, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8597893118, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.6626129614, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8597893118, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.589661355, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.752891475, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5300714513, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7461630751, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4801289745, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6766690087, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3272712268, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6272846474, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3272712268, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6272846474, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3042148589, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5662363924, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3207873973, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5817366082, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2848931828, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.576432511, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2981792161, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5788026001, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3942058093, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5878575558, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2981792161, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5788026001, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3485799123, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6090575372, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.6471892368, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8142499722, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.7012294788, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.847811572, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4020247735, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7469480084, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2371332025, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.610684297, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2169036581, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5384773679, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2311466382, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5786592585, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2212877653, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.560943925, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2212877653, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.572263303, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6888365053, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8656273481, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2571138654, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6088853752, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2571138654, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6088853752, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3416581331, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6578570934, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3060368951, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6736142285, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3263040637, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.339038739, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6170420597, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3142665434, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6466526067, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3751840463, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6279894553, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1926847964, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5513970749, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6255340042, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8724783049, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3083012996, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.658937639, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4302123694, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7142896582, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4101479465, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7041976254, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4547900039, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6541971429, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2919394074, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5957961315, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1753767087, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.480088967, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.33828653, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6408187444, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5950922113, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7971172821, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7122562458, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7122562458, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4207937381, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6985308026, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.6511582134, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.8600023705, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3226386416, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6824395077, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7719180937, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6590438072, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3226386416, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6824395077, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3830597818, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6061131723, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3463680071, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5167955767, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3675667566, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5397693417, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7417101158, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4222184785, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6656008733, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4481489512, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7994721822, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.387540775, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5985033329, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5124776603, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7722874801, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.179052784, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3725729545, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1552160603, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.376453294, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1262042989, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3558070379, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1287222063, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3360263395, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1446578398, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3030283215, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1418524086, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3829577077, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1526801905, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4102875762, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0308601662, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1100250144, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2125532771, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4327215157, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.175608616, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4284862592, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1738234764, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4061580778, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1386817294, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3094469764, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1036185485, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3277480271, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1518696932, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3458120002, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1551417935, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3762636488, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0943129772, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3616856339, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1109125268, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2660763461, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.1897170832, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1026674747, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3364703639, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1532505429, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4125406717, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.145578084, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3659834676, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1815495479, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4557483776, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0689753389, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2776666563, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1665765483, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4017968725, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1052201444, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3254405154, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1678010916, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3968694015, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1381751569, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3121557499, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1579497466, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5092928546, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.162868761, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3422914837, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2489421388, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4083799714, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1169764262, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3711775364, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2006511507, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4084885616, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.1762196387, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0991614609, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3121110161, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.156345665, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4110013716, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1380561569, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4078799873, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.122912191, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3448002181, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1764307831, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4075758479, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1989414239, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3791567777, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1947336505, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4169850144, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1914828287, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4707949702, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2060857231, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4704943906, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0818335366, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2500763339, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0981642546, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3179322233, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1643920943, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4076099284, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1215724157, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4080990098, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0854164839, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2825804067, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1041529816, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3345263292, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2120423927, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3846197304, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1869333815, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4290809947, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1643188797, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4088971379, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1145250892, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3212742401, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0821835945, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2390539176, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1767383562, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.390208518, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1960939563, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4429882447, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1518427872, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4093399938, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1547822267, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.355058476, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0624444512, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2823983493, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1568563265, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3437829588, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0826693165, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3127511921, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5989315087, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7353063746, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3067706489, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5308555945, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1327526848, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3785060249, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1840503544, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.414290109, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3381363586, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4262221594, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5886657415, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2866084411, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4579283646, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2586113059, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3945264409, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2037925062, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4108541431, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1691326883, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5792139687, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5553909583, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5553909583, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2579872309, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.524485423, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5553909583, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4609261192, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6365915339, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1690979933, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3751861276, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3344305109, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3701750146, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2283032715, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4341368545, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5234484809, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6658297774, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2840563957, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5110250591, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3000750469, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5153810823, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1407495777, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3750035199, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2543269102, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4829947079, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3815250265, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6516314752, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1992041348, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4253779693, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1899029242, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.407218439, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1871026059, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4433431372, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2049841563, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4155916631, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4000381043, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5899097408, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2040179688, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4331763045, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2097387762, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4966330151, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2706716802, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5439625482, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3337338879, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.550089922, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3804753173, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.494857231, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.204488707, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3847158513, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2309552735, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4672309378, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2988665867, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.327060774, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.448923596, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5934678825, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.298050419, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.510126892, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2880086933, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4934867862, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2429163097, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5044329486, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3205104057, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.584870798, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4683276331, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8176110135, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.9436043262, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.988019168, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0067104199, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3642482473, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5342538783, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.188319335, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4318025704, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4439623528, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5309137919, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2628849077, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2375594795, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4291541973, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.284061369, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5649283064, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2154402759, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5040038441, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2855212789, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1644894761, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2364455179, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1855954214, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3804842883, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3536937539, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1308768293, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.1946295298, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0135384977, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3375178722, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4840651439, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1512218921, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2675011051, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1075992769, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2106579454, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0784377299, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1324578892, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0816397707, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1617131493, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2876418496, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2168548583, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3714219747, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1227409298, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3385513652, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1463197333, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3661372734, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1265649403, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3156355831, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2496001284, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4448983036, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1122890322, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.1772610005, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3101771609, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1427671612, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3191375425, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0223039199, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2676522616, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4201493552, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3710595253, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2168828306, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4177582416, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.182352473, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4077952398, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0139152884, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1949274978, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4345593627, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1266637216, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2650373529, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1216277939, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3228288841, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1649662542, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3466546857, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0153696674, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1588436203, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3981499896, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2032648426, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.2922087191, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1823759948, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3740403512, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.2244748716, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0072819069, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3662268411, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5409038674, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1740044679, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3637515238, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1287668952, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3253153379, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1326935302, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2899808984, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.013575256, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2592282745, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3913113625, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3227889517, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4026302132, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1191597493, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2129794266, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.140502651, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2478525818, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0223039199, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2791576982, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.369632421, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1692546646, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3591239885, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2036348471, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3472831656, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2154769743, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.180399603, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1464506683, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.348347983, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2327080491, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4213315211, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2436235351, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1400583077, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2827131457, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0194337786, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3114449377, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4723803506, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2568191876, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2813584915, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1358560869, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2460209347, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0147491229, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2390985318, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6358921903, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8041899227, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6299285159, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7993134129, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.710159574, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8462481748, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5487830137, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7723896504, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5375319287, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7826716937, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3505907645, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4021980348, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4131612771, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4430321339, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3993284843, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4224738565, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2908087026, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.34113614, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3686151885, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3858999291, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8780634321, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9269467001, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7964573358, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8458636472, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9452996323, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9463396364, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8781548422, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9156314785, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4067397119, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6897190926, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3707525915, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6481906762, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4405434566, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6872423435, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.340705194, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6376396417, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3134536528, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6269464695, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.7033737197, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7784050705, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4699587339, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.584375606, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.6034601376, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7074074363, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.520069265, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6586847274, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5176708393, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6443244311, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3489926819, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5715668842, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2786169605, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5267252236, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3544632222, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5208748527, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2679728612, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4666913728, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3244555847, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5576074375, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.341024469, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5816669417, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4234343012, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6625289906, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3885765192, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6554470157, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.381088643, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6485553379, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3602811871, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6460863746, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4324680012, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5877600879, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4493940084, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6230960824, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4116575553, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5665759692, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3533147318, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5972951641, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4771981138, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6315763749, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6947677374, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7941300667, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6412098672, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7665040244, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6045639361, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7576570568, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5438238038, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7060850658, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6197738787, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7658055016, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3861375213, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5122109329, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3253992126, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5133457276, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3750795127, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5371301483, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4845646373, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5906105669, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4092755331, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5662949759, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4354194543, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.665617533, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5941815558, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7983203559, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4524360013, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6715594087, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.335542878, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6348737823, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5203658198, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7286515973, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.398304592, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6521777109, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2682038772, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5791297455, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2276653674, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5321260121, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1498185575, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5073561651, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3776712971, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6263797337, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3880515885, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6587916716, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5142726846, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7344716263, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6066498621, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7812137754, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4342750765, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7115011222, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3893969298, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6629460107, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4487746168, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4476730201, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.28366234, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2914733724, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2775905064, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.316576728, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2891243295, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3111960394, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3679317258, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3623820326, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2113054108, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4423822999, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2620790359, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5007312322, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1609807304, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3971037508, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1146562315, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4497512969, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2035086444, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4226564278, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4556160154, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6661994452, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.321675602, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6141241026, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4336904847, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6586872889, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4098419225, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6358736384, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3916220735, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6550784354, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3757080934, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6339141735, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5593324226, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7332911901, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4845738245, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7144409873, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4881942815, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6662053432, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4577386766, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6531477301, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3446592077, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5819912584, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.232709381, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4490269267, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1163446833, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1766119945, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3986479587, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.365728408, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5794132414, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5295277583, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6540432511, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4970423291, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6453248294, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4970423291, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6453248294, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5494410974, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6853937472, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.464523041, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6240758264, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3479698394, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5760833126, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2437325371, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4948203921, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3120506351, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5390444512, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2422988979, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4853505496, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2759710526, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5468536897, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.298869704, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.544252266, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5007036357, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6501904887, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.487646318, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6113405964, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5199813504, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6584629523, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4743196503, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6291489876, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4333022325, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.556449953, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1466607446, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3655296382, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2052749403, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4358647505, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3047577636, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.483185127, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2580795409, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4391402666, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.418078222, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5775458912, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3475258894, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5729813197, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4610791065, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5982792042, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4642320267, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6555816107, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.0007348618, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2023879631, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5665467523, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4612469192, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6895404842, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4688149932, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6935921005, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3190700151, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6396787125, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4257525491, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6704469753, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7017829861, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7743327022, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6961795372, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7859480663, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5643442092, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7005543453, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.543231275, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6677259865, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7108042923, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8180084375, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1411835006, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2043183778, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1811004938, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2649993137, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1408901109, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2194460381, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1250181903, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2634990041, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3107963896, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2072192435, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3647593219, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1138660795, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3356458335, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1686235632, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3637462812, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1485432117, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2759460538, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4266832189, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.464426437, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5519480629, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.626894179, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6958291103, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4554740717, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.549876635, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3581781081, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5012707041, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6297960259, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7117676662, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2283768002, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4416418023, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4151474543, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6389524687, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4355097603, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6511365998, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2468185992, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4679216763, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4295348441, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.623113134, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1163412939, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.315309023, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.195447958, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3835451744, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.198893335, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3885583773, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.244801029, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1768354493, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3684372572, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.359355104, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5589602235, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4267520229, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5518115367, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4248870612, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5641041633, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4042942963, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5757999868, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4538153281, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5943177067, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3555103419, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5627284646, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5039752491, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6136695013, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3693229588, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5524455185, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0803311992, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2302164129, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3284978808, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4983088157, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5088535943, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6252025968, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5620488199, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7192054484, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5550041554, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6554946147, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.440689626, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5713280637, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5530531361, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.756238556, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3941975149, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.519104648, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2626339401, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4192320655, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3850172427, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5264633431, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1536323419, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2697691813, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4379048206, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.261816185, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4694658943, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4395347892, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6124294443, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.337115074, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5683831732, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3222423456, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5643748238, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3260557929, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5464327823, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1313941359, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2490406851, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3112317272, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.436159773, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3671734945, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.493827516, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3267949175, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5061357552, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3784649355, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4712244356, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9484564543, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7505336183, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8401910628, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.92894163, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4450050658, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7558874882, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8107492451, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9000327478, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1345392715, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1052297427, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2205549369, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3931965049, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1375527487, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1039771531, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1389994121, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1094730342, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1372586106, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1114738485, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6885326215, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8229812189, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8395876231, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9096086669, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7267072831, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8396959978, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6374950652, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6643984253, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7608566263, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.881580297, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3480442076, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6142483233, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2861853478, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6401604433, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2861853478, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6401604433, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2852636439, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6732018003, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1840992999, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5294826056, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1740151771, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.450062616, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1512404438, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4224869588, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1512404438, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4224869588, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2686001166, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1417229241, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4762857001, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2028736642, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.361485664, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2255489037, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.395492575, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2927057122, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4330945753, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.18038303, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.320678468, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2721438001, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4053920466, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2929807168, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.597559507, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6689604664, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8010329765, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6689604664, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8010329765, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.149089608, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4761746966, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3077874158, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5260758147, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4113125177, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4280807576, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3268514139, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3758692874, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3734832063, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3839166952, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3804672237, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4337083419, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4171995809, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4623764371, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6237774736, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8500131525, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5737647229, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8179798595, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2320305803, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6224956013, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2144945948, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6528501353, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2244975801, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5326826664, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.201640652, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.392353398, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4212555585, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4426408937, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2750774388, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3471215691, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3132288506, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3821582739, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3286610737, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.385722787, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3471790743, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5354826965, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1452867953, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4562626418, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2114623992, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3672220684, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1136535202, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5427832684, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4062083693, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.2246029758, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4765874091, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4591155777, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4502212538, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4687426738, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.6350593429, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6022395695, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3407065042, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3482814151, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.7215691881, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.7351007898, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3013901676, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3810601296, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3518774507, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2850647115, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3190905975, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3809137042, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5405504436, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3631474834, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5392658386, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2293530952, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4689601315, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2294068721, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4045836405, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3258864375, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3200317028, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2308824748, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4093450186, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.232779904, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4150815685, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4523791233, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6299071574, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2373681044, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4004852416, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2916261379, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4106520927, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2827647331, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3743678965, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1100868155, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.297203493, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5605065819, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5868532678, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3630029634, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5816676674, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.352539976, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.579811697, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3927053213, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5108598155, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5369357392, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5869601651, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2876540853, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4046608868, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1819722649, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4425473022, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2529183169, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4482360279, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2796002691, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4817204985, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1708721495, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3646964804, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1330519954, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4324498727, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3377385621, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.525612845, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4477604756, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5801193948, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.287558382, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6087635831, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3569375456, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5492415189, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1254691277, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2651343524, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1240721616, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2664864612, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1126159789, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2523482734, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1275785595, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3385577202, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0841173493, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2901271494, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5322520826, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7271316675, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5266403878, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6838125749, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6871514991, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.699912443, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5322520826, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7271316675, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2092659579, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.535476676, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1284866897, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5495968221, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3099627272, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5376391724, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1574248334, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4351951744, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5074919773, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6528956125, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2887138087, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6342291346, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7013062757, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9303769449, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.23816585, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3758990206, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4255415128, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1927292346, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3145892043, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4298810543, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7577244658, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.5366411242, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8255664943, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6179396438, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.866516296, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4360038791, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7669087485, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4563369808, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.787353904, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4165530721, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.702780513, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4027788022, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6872835607, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4024582794, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6664090182, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5552412315, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6976333496, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.8331572108, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4130732371, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5785653392, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5248587176, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6664855309, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5248587176, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6664855309, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3279713812, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4864562825, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4987046236, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.647874639, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1772984226, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4103582048, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3489583637, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4767378359, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4010889715, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5642546048, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3014528044, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.472975393, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2199206296, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4070442354, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8958039312, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9382091007, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6433799262, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8103769737, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5403356451, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7639130574, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4500531895, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4302706554, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4933292241, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5225247298, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.234878114, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4062284747, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3763743474, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4017565065, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5135063581, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5263652477, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5212982931, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3531901509, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5822934956, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3531901509, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5822934956, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5095895502, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3532802306, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5839265502, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3855522726, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5872605669, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4426623527, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.636837103, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.366634099, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5782960279, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3289267652, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.580076131, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4655035539, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6467306329, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1965085477, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5134302168, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5187615227, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5205634208, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5187615227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5287371836, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5106109398, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7688046995, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4477845944, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7043336945, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3221411249, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7794716829, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.556499296, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5129586382, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7857394056, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3263040637, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5561195823, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5362935676, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5803515898, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5422220469, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4204739941, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5173824079, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4177866849, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5243375045, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4593860924, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5045746405, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3343829907, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5409759573, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3785406892, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5743796566, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3785406892, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5768306472, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3213450436, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5076725974, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3075951598, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4988668236, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4550680331, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6477506541, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5923136157, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7382416556, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5923136157, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7568286018, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4018202851, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6003256952, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7542976177, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4018202851, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6003256952, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5263574469, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5582486914, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6678493404, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3771745743, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5554130492, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3159892348, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1895316299, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4587674595, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2383770505, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4666458696, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2556795749, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4561555898, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7629273293, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8510385545, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9094153226, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6425503167, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.807889193, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4934916371, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.694445271, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.303764309, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5183662698, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1837671115, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3981272326, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3409605607, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5217663813, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2989898445, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5359750729, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.8253498773, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8529564805, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7944837206, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.878453174, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7944837206, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.878453174, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6941268298, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7679844671, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5828833474, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.7908226509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3869431776, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5953878513, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2620499196, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4893724002, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2212877653, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4999323991, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4272870064, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6271734609, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5040673596, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6469962279, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2281684904, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4984990869, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5106109398, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6635467153, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.325909498, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5501364765, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.7498810286, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7726337965, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3954948172, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4821021676, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5029543425, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2254310841, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5721164466, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4884391792, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7050595168, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4902350231, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7638414724, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4424906783, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7055079713, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4145278784, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6973605664, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4103230277, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6634154487, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6380575768, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.824567364, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0786010539, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0967837769, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1160114131, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2167118757, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2390076355, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3357015413, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1371661844, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2345567914, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1809155303, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3604670694, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3501522472, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5701648579, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3349252033, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5908087432, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3258812298, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5753985305, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2883113323, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5835478395, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2347500093, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5032853946, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.344905813, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.536561983, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2968884568, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5494319015, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3257602417, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.566659654, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2251114029, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5538390232, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3029863251, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5652374403, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2537603225, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5334329404, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2003914161, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3612331209, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0564437248, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1502603746, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4303467795, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3275231027, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6168686838, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3270769537, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5166643607, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3069937936, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5024648106, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3575909322, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5409483829, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2228729825, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4466759653, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2662960357, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5253549609, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3927237742, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7451438087, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5570357635, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8116469942, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3508597297, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6833592152, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2125947044, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5863866794, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.443404947, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7587103444, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3826576187, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6071841372, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3447241448, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5531085141, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3178743908, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5513949312, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1883251048, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4530322538, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0192989769, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3112863571, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6304411194, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1330856181, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5312476702, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.257912492, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5545120254, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1595487508, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4511156609, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5928508276, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2879556779, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4554184077, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0957892195, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4047288792, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2296566982, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4624781939, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0892095247, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.322418757, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0659828829, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3008263307, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3872951671, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6571482446, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3299562825, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5982616321, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4381454708, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.616374622, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3614922712, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5698489013, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3957463069, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6093311945, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3665528144, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5966563048, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.258729775, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5132023402, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2914897523, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5714769597, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1115093771, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4170915413, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1206120707, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4663892484, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3480079866, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6148736551, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.312222584, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5549937871, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2706573913, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5619563044, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2133109831, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4766025973, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1985082374, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5129122522, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2368307518, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2631328191, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1645539243, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1367388582, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0528214025, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1072112607, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4615978016, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6280777654, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.422429895, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6082308552, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3045125886, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4983778741, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3676904072, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4064141882, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3472289737, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4103553163, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4155938131, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.328671194, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5944310795, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1354727734, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.483018962, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2297009209, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5537467827, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1354727734, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4685134393, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3498215109, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5324168516, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3874773379, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3174769726, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4079777866, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3818556455, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3785761837, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3818556455, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4693593336, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7730555735, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4336894555, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6409951781, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3681829215, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6273930299, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4389321784, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6468470369, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4336894555, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6805799636, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.316021361, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.516561467, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.307587447, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4684197705, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3716923706, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5383668332, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1865526716, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3640275544, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1420081588, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3704326476, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2961516536, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4980392435, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3459667619, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6170810606, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2362379063, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5441149449, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3593699487, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6492026441, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2989025113, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6058743572, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4683276331, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.8176110135, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9436043262, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.988019168, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0067104199, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4593546098, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6086021462, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2338678621, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.466629299, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1634124231, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4007254932, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1395211838, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4030284875, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3419664739, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4989057927, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3397180517, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6494995649, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2381198934, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4812080785, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2316879948, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.525267212, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2889285495, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4536746865, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4136211902, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6393493535, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6031612036, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7362867034, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3943234482, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5943452555, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3443768664, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6090402109, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3920558089, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6772940234, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4263005629, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6665768162, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1125439789, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2062328899, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1100081929, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1896706167, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1077233201, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2360903687, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1498435849, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2105170009, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1148374893, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2218739144, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2449339028, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4811362511, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1947668131, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4203040773, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3360050269, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5162346122, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1033604925, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3088863285, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2176929795, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.454042834, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3459789902, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5620330456, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3782571349, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5584414289, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.369537503, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5568751295, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4792316814, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6534660189, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4200122603, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6060665796, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1845747513, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4437997152, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1821246362, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4695925404, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.20734617, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5036833881, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2817686971, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5170853674, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2701727285, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5162766223, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2517176763, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.451373445, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3128384317, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4801627921, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3508847644, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5291980445, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2674628639, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.478429215, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2643715067, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4590454051, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4320063812, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6892273788, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3411951585, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6539473951, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4737246708, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7348004695, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5582838438, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7625459507, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5641401219, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7505430817, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4047570083, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4349871721, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4749702454, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3805666011, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4158948448, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5244380104, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6914581279, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4472834999, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.645713027, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4034697489, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5836273992, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.452120997, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6307076431, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5201565256, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6663170491, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5041542875, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6074467585, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1877181603, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.375941608, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2828480467, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4330386622, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2631417381, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4194315681, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3180687408, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4375097637, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3368441656, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6173496967, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2105458851, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5020237474, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2108312271, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4950405689, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2259358117, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4781181087, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3653727003, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6006612018, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.112836786, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5027560731, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2943290953, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5637465581, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2066516314, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5424961082, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3720123244, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.185863022, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5550584876, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.403061835, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6065077242, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3756985487, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.599144377, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3437925129, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.549615844, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4457795439, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6608358312, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5013226549, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6749353854, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4892530409, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6697286007, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5009456904, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6893719644, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5011800955, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6882325338, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.424511135, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6326418046, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4307886338, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5983383363, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4986876043, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.649557701, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1827394486, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4426186519, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1921021634, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4109063493, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2019984491, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.429696162, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2355500146, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4328470749, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3897372021, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5520780806, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2153742038, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4581737689, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2258331489, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4634872124, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2000682107, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4221394795, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2221644328, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4276459077, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2775751477, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.546740784, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3372953649, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.548250538, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.359804125, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5672133518, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2757880829, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4682894377, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2898775882, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5097463472, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2988083057, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4973008563, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2852890535, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4885812318, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3579736298, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5379266632, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2606045001, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4525313379, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3739173814, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5300063373, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3512050938, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5127991323, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2935204022, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4867597973, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3639469, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5567484828, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2787040884, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.486893586, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.303649574, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.490461471, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.491328688, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6524450167, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2929684585, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5038324436, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.341417164, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5306256203, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3858101625, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5618844078, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.371873106, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5079209956, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2710678414, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4582877456, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4034224234, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5736798835, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4711759071, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6157183059, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.484032906, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6570537612, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.5211295958, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6543358671, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2822871797, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.520891503, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1077205147, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4283381456, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0954366751, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.405189985, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1408702259, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4275237095, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3077490672, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4982442692, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4102082155, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5474039588, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2232776795, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4063556881, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2623485199, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4686295192, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2247203214, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4363253004, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2699962663, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4462786481, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2242445367, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4163744411, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.25727332, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4520014139, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2311264429, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4228120751, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1733396766, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3715761436, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2788402943, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4808977586, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4016505306, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5837756195, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.40311197, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5788525109, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3091271358, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5376618149, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2280007166, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4763467107, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4274089004, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5996769756, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4987219594, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6907054265, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4531357898, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6160993562, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3764064622, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5429063669, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4331983607, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6016623009, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4931039911, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6618877666, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3411271681, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5323123267, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2651736858, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4491383344, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.308208266, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5077609646, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3215106481, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5058205933, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3292501962, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5076613848, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.248284306, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5078550623, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3454531996, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.572705286, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4256604039, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5952544825, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3594882998, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5639910704, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4383332081, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6068355218, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4381699513, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5887410281, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3896886796, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5581403039, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4437827937, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5825113284, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3409306042, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5050414553, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4312966248, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5796681637, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1772747397, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3475071695, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2045141661, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.381852854, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.246780308, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4463603006, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1773614249, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3654025503, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2073997043, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4243703395, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.5494025263, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6860161544, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2636405083, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.507200947, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3994138414, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6335699197, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.324408202, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.581602476, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3433793467, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.531256118, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4222656487, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6421614792, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2017417362, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5179166118, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.5116634146, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6950231685, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2772024607, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5433539614, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4509728065, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6500555759, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3531793316, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5558881348, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3352283336, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5341959299, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3279338214, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5206722319, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.19002495, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4570054063, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3417785003, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5213383974, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.4397415107, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5907735811, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3130882423, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4950165424, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2864658402, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4746124656, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2124053523, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.39859173, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.4261122399, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5780599655, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4689079644, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6445795993, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3070469439, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.521746887, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3675770738, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5833872029, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2381080413, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4678770958, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4648698751, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6377045673, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3538966479, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4179644538, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1111609137, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4330740108, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0764997889, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4103166432, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4342201553, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4375922921, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1050510646, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4474870049, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1153497657, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.467613299, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0487561532, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3938156292, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.435016773, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4239838444, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0009218289, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1488374684, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4476843235, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0799981999, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3889987133, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4518285011, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3374178992, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1565385979, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4317779805, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3848892679, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0592815464, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3161457142, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1550056038, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4433773218, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1010643984, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4445092648, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0891537192, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3970634926, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0799284495, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4400081801, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0955468154, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4142248559, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1018099322, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4132076508, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0523591033, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3805982553, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0950136506, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4372017487, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0946260954, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4353772493, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1571451546, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3917510042, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4404222773, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1259356761, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4456827452, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1643146815, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5127730105, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4197215835, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1355093777, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5030190997, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1083397187, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4467303749, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1632249418, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4815584994, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0889465243, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.444906007, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1029835797, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.440451876, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1296992764, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4176676149, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0946382889, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3398200805, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0904087253, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4183051317, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1823776118, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4897620962, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1316088195, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4719647515, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1965214861, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4627668713, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.172081413, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4542522451, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2135190266, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5130443042, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1055317928, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4283144779, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1081470635, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4216597037, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1128334543, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4205902028, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3876375615, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1626998642, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1196063679, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4498565343, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0653039796, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3689954584, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1471854548, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.460257245, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2398247113, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0693983815, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1384529883, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3827779045, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1162066331, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3781611496, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0872069557, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3539397058, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3544628607, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3371547585, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3473356627, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3436708647, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0752835937, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3929787161, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0967623049, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.432663695, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1691386174, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.492078934, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2633720088, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5332559902, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.128203556, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3621325952, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0962657473, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4247768565, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2356661679, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5124350706, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1494443252, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4972796479, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2128223811, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5048999729, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2159761643, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5016920564, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2025321568, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4851328772, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1072039195, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3721960528, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0979331693, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4297577432, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1046199321, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4115395742, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0923287541, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4057472974, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0610671152, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3575665488, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.068517235, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4091114966, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1418499891, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4449815965, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0986847451, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4007829842, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1245953936, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4660673682, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.436501506, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3674193701, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1122045089, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4612996284, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1495364895, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4736386375, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0999644661, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3817082202, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0638705439, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3815759231, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3275292968, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0893298382, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3746213289, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.121516839, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3874631849, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1020494145, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3642762802, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4198632526, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1383193561, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.422971772, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1484639283, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4493910326, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1214642415, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4236242054, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1094074966, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4056454797, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1522082246, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4115596298, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3539070801, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1134012914, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4168800407, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0743868134, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3894532191, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1228901286, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4301477375, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4226914212, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3241317524, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0735165222, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3862617014, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3822492761, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3775429523, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0978910021, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3998935506, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3499024159, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1258730141, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4327857303, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0807285976, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3683463348, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0780186217, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3649626949, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.395791121, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6431490866, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.381895674, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6154314826, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3436153961, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5954254643, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4339219137, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6338401824, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4867425155, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6949024222, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3525333892, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6487975155, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2126707921, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4659908461, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2914880531, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5962886968, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2394466657, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.510650924, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3157230364, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6026946145, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2451341489, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.547664761, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2324010239, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4973274283, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2516768028, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4724978187, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1610526599, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4043773717, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2920934314, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5778663411, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2865352864, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5053636612, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1797938473, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4177311931, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2767429729, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5118375022, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3192837057, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4886865885, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3800528767, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5075280145, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3132694642, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5911719769, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1702602472, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4366640708, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2615659486, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5126931978, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1840585956, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5282240694, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2435840338, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5152157452, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5294442647, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7281375073, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.9336510696, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.958650753, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.9336510696, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.958650753, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.6337520241, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7734740774, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.7096224668, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.8862932371, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.416291599, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5970097206, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3816408219, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5784105768, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3923434274, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.597218609, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3612508194, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.610598826, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4631704105, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6800890175, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2584847655, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4897308313, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1839822664, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3728501053, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1811683074, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.378028437, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2539169853, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4294871149, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4041338117, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5261706483, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2985169054, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.622420986, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2695888454, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5631664733, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2503955136, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5411247834, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2611502134, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5520240492, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2783789933, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5673065269, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.297969127, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5158892363, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4005296398, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6201785377, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4005296398, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5910864031, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3114493864, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5682352099, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2782453336, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5540161526, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.173772616, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4342710498, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1595648358, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4256934207, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0979157953, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4043298644, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1042356347, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3439000682, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1751312977, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4777391919, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3363139801, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6332428715, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2323385181, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5019509292, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1972647242, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5084335266, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2289796737, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5158963535, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3061554451, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.613003519, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2453238227, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5501708058, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2295217731, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5279520953, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2950615457, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5675143775, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1864340365, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.504828001, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3466720379, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6312259441, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2063529291, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4136424802, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3618488169, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5708179622, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4453684683, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6266013058, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4528624345, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5635810888, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3548439094, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6152611696, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1058614013, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4674053478, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1712766252, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5225554963, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1549337617, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4706378089, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0875931037, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4119714832, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2451791783, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5630094449, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2703645496, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5129310433, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2709079038, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4474580194, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.270750755, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5079958751, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1913449287, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4261251088, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2845070198, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5183351563, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2492031334, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4923163375, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2907608105, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5445465035, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3021915703, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.549228869, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2166046272, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5246154268, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4173623672, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6539468166, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4310450414, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5953439402, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2790718869, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5093017177, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2276330877, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4328919789, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2865267928, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4341260827, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2951278924, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4907465238, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2086398446, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4587980194, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2695149222, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4713033965, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0883991405, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1321004694, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2266962937, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4780713177, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3497701087, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5444479223, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2733878926, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5429269981, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2075953797, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4344742362, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2938167712, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4842449941, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2063529291, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4812376698, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4173738681, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6106512856, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3703971547, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6509854049, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3020089249, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.566679124, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3169340576, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6047772126, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2728224725, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5858336859, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3468503425, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6177731406, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1515551103, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4945579176, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1059786102, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2561557977, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1550710073, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.483224092, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1488909539, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4153640076, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3800528767, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5867504755, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2466475164, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4870238348, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2103019562, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4375454772, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2139607533, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5173735729, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2294179787, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4218698188, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3268780818, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5888362088, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7246473808, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7282086346, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5793367581, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6502428442, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1766290326, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3595736267, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3082642374, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4128975676, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5835260168, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6994652194, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2740561286, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4639958592, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4390960898, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5417421788, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1323229159, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3019016697, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2682503411, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3763062102, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.6052987577, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6436021707, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1300480047, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2821714216, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3924259175, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4505055715, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1060131743, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2344095627, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1545007955, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2510089623, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4815092082, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.578525119, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3782148637, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4718665834, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3542398584, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4293667924, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2933705789, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3557011076, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4155813233, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4683680116, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3869431776, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4582771186, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.369938226, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4032851361, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4237819055, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4733550728, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3763278728, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3900945781, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4092112922, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4452176798, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4115167991, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5649900101, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4516759457, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5169677928, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2706805631, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3818680661, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1890425468, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.351301969, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2245512943, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3153073205, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2448951689, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4093697621, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2338678621, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3780009827, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2669637888, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3581548569, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1262744724, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2526668887, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3595597536, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5042608117, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3989952326, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3925121365, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.477885928, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3542398584, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4401068256, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1926368467, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1636811804, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3476956164, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1589651999, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2951399946, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1423412184, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2596718628, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.176159623, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2443147455, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3120848454, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3640187353, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3571150501, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5018967495, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3572188193, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4538117529, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3572188193, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4293706489, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2513073727, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3798674638, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2677353447, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3576865471, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1068282725, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2155111731, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0742505552, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1812234105, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1635267086, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2640633398, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.149749592, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1064085069, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1954606752, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2774527634, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4358323759, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1978585723, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3527599187, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3021375397, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4603540138, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1299191651, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2788939261, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1076532625, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2268211743, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.519930223, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.601748102, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2523019529, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4406369073, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4195959936, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5643628666, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3597457896, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5294218016, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2934521274, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4075394811, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1923018801, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3407021379, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4107267548, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.563558915, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4122974403, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4981294586, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0981216326, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2826014149, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2948629666, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3757242758, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6612342258, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.38833759, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4643731845, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1155664799, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2374832333, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2589451141, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3626530243, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1157064511, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.240912339, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.6064630666, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6712747227, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7123666275, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6560788161, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2584145049, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4449478422, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2274336387, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4134707988, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1472895431, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2256490809, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3730033182, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2488310827, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3329995141, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1382717572, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2588011279, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1221966748, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2405164296, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.7795149904, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.8912732146, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6994652194, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3676308285, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4293667924, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4372855386, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4380646029, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3535749731, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4045670776, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.303890587, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.431089691, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3763278728, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4261526683, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.36210097, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4423339373, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3763278728, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4047854121, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3865695386, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3844238862, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3902273664, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5202587069, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3672404085, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4518744271, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3433270406, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4086391312, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3672404085, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.432886828, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3924259175, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4246539837, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2538333923, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4612346143, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1640179865, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3760928912, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3175634859, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6126383724, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1535259784, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3544969745, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2396621968, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5164809275, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.178071294, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0784377299, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2669076053, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1291353308, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2521959501, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1080439968, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2472647721, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2201844821, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2705349648, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3029928207, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4526215373, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4300000761, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5073076708, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4125656014, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4621663226, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3512502253, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4386915774, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.174146751, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2858414981, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.441049252, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.44291963, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4746507483, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.44291963, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3844263765, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3805770883, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6474126202, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5802683404, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5802683404, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5521590063, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1992340566, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6211036406, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3446073377, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.762169638, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3237722713, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7426638026, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3703046834, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7587397825, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5453111149, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.339237555, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7348936586, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2594750714, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6659437948, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4934217591, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4754189767, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4684716537, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4215643004, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.195647515, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5725643788, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4352628824, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3620843367, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3550428473, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1884239372, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5854975501, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5753050684, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5116862202, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2213147799, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6188310784, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4928989791, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5769327326, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5204725155, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3347161634, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3198143077, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2594403516, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.297593612, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2961516536, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7355780987, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2865612242, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6433813179, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2651812298, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6541173886, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2622067644, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6463231753, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2722589423, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6585715472, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4362060592, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3598792258, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.325832365, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3209186109, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.500271653, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5343147728, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5125809225, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5125809225, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4782537016, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6245566175, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5539920925, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5539920925, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5633410521, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5963099883, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5326397959, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5226572947, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5226572947, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5210387657, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5309753108, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5073395825, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5073395825, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5054194885, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4923304298, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4877445614, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3370934794, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2938259561, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.319663122, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3095023687, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3382125208, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3222538602, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7495871588, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5773664661, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1624355753, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6732778878, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3146660997, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7749196539, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7180407771, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3057729079, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3053963874, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3025031428, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3038662664, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3463770747, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4660343509, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4334093215, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4169735478, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.431892517, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4024251521, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2125884413, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.631489137, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1582128589, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6605676082, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.535205964, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4817621004, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6090533288, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5700887051, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5873831965, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4709927497, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4180569412, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5317734594, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4823185396, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.373146928, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.412067526, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4669656954, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.412067526, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1892240569, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5196343732, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4254686257, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3088290057, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2898500891, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2033344819, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4539198581, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4271693186, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4458379933, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4456299718, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3948956358, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4568968866, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5069487415, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7801245319, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.6358974377, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7366619371, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7196315267, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8835331637, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4015773328, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6532350819, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3809137042, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6438225862, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.313744506, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6422405833, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4924584878, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7062510643, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3132768115, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6093422257, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7202697993, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7202697993, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1943759863, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4968810396, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3903594391, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6662116837, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4727805713, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7717158158, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3681601704, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6630063658, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3745653574, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6126780726, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4719458928, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6863265729, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5309354663, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6990707993, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4338561264, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6552557413, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4719458928, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6863265729, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.637202263, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7346216973, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2289493933, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5747669846, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2754532129, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6280000881, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2289493933, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5883432091, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.7221847203, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.8931067232, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3416581331, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6578570934, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.9292326051, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2335769717, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6610479564, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2127002417, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6183813549, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7342525134, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4797543511, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7240781311, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7342525134, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7342525134, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5420890779, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7219273458, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.6401876411, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.7526484951, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.5184341074, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.7295047042, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4252502464, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6774296788, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4252502464, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6774296788, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3305712968, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5669225665, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3305712968, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5669225665, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3305712968, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5669225665, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3240220869, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5364140652, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4301823405, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.5468017145, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7519227909, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.6179396438, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8356543645, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.6179396438, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8356543645, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2772093802, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4280471803, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3035069042, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2813985982, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2810748887, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2954873212, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.6281881652, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7361567091, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.5691338869, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6834516952, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1680761126, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4597054186, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.334306348, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.542917167, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.450478099, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6386322493, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2724974523, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5764878064, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3207873973, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.57798384, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3296512955, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5788023273, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.186096212, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.543850457, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1792334464, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5428745815, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4814564802, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.7954823724, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3742893656, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.7582803042, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.6316839256, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.8143078359, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.5069487415, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.8112065455, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.6028670503, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.8176176658, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5386695403, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3788827324, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6841096204, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.6312184805, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.787428944, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6719386832, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.520657106, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6893242589, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3034437123, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6219235057, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.215553788, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.55779767, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4411997844, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6860816819, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1715029616, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4881295488, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.460769794, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3900016865, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3509453606, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3156961171, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5247546298, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4168218947, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6573099562, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2852636439, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5851048071, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1763647856, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5283932773, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4203546552, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5512324462, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7289444697, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3737098172, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.683220117, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6507561417, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8215788698, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6507561417, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8215788698, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2719326877, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6002086363, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7246227738, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7395804946, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3684981985, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5606332518, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3694816689, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1423071533, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.523427625, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6532234058, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3201911828, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7182383859, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4536404448, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.8020827134, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5134477226, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.228313868, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6930977636, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.80841236, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.454509184, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.71660504, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2919394074, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6265777782, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.434567376, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7033881185, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4812700338, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7668482136, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3370129265, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7096874944, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1991040145, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5815343547, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1624355753, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.495296847, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4530777804, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6384504056, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4201902478, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2318507812, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5831825814, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3748904745, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7155230966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7807505268, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2697856976, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5736298373, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3766019021, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7318674194, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7807505268, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7246227738, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5595205106, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.8322210048, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7246227738, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3942058093, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6697898835, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3142665434, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6466526067, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.693430928, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2453392175, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6569130291, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5760406199, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3610544299, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.491251159, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3610544299, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.491251159, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3733543476, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.538395941, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3610544299, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.491251159, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1973212456, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4151043049, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8578928093, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9422733087, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8578928093, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9422733087, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6750223515, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4281822436, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6679016788, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2453392175, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5365332656, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2910624919, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5255862986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3868757399, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6514359547, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4210537268, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7001171094, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1991040145, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5338904589, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2423357235, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5675102324, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.443270969, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.8110307349, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2767906931, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.694645353, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.368528912, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6989312471, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.7395804946, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5275280991, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4094709586, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4738480793, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6506028605, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.707627182, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.712860367, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3584668928, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6348630986, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3584668928, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6348630986, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2397212592, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6266330371, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4206288824, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6813469637, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2600960555, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1989810735, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5339708888, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4770332229, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2164431164, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6255338654, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3942058093, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6294033705, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3942058093, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6452705346, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1712473045, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5272789143, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2111187176, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5086920945, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3954512194, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6541357657, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4328182641, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4282924874, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4056299815, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1841353306, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5210859722, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4787974949, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7133324771, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3295245162, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4924875779, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4021713046, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4199894419, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7020733406, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1675856372, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4598125963, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0787543315, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2638954514, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1233463014, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3570869172, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1915319533, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4035796399, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1979009586, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4684771025, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1804170093, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4385244892, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1073408885, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3394679635, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1249928726, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3031531069, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1431831723, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3567561178, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1950672443, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4479378869, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1519743694, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3727100036, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1779592052, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.418629554, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1706064418, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4054584763, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1767019939, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3668222737, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1266280767, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3421762779, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2026698858, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4817971916, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1938804841, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4436170238, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0516685469, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3008745507, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0752378866, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2771251147, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1401600076, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3800106322, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1733774759, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3602154896, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1237012344, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3333186683, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1363639818, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2898718275, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1120973071, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3136454052, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.23687866, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3841141484, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2092329802, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4391664942, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1558980257, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.378942068, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1569702195, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3714913924, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1074843144, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3292908635, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1327954312, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4156436577, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.133037981, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3647236067, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1948502779, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3552581598, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1237039655, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3658305221, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2119411486, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4350656027, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.199888698, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4809586782, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.176968806, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4304703803, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1618333627, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3458746997, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.177405522, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4174119524, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1442495031, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3320792016, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.186464805, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.384706931, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1718337984, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4265037421, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1739311121, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.390428122, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1443757069, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3403124595, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2020425406, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4063113408, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0921560702, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3442184232, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.229220723, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5075702211, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.190646897, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3695492182, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1959125091, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4012747454, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1450836461, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3190746194, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2211061599, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4075369928, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1139786751, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.439050138, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1785851273, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.38007334, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1092720908, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3154924313, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1439962219, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4092763412, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0867043106, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.344059045, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1885132032, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4118109845, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2011394318, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5054929216, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1237100149, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3523308147, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1433426997, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3181383362, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1792100757, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4219795466, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0663830136, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3361782682, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0708828152, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.1725752257, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1141404109, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3500627311, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1313979824, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3491182293, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.192722549, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4132550155, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2327204102, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5347837552, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1190141333, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2908877284, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0710365684, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.275344202, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1332963021, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.326901495, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1804466262, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4057030488, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1596499518, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.358130588, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.155938575, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3832822127, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0396462656, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.1633851469, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0560466756, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.1884168481, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2096494314, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3690324235, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1408659824, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3613700886, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2110772064, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4391150618, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0393770914, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1561676171, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1206688552, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2616326727, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1359614567, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2880980105, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1608400882, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4945344612, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1382794788, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4010585708, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2520901949, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2127149386, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4803275784, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.105555485, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.369837221, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1605078796, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3607284417, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0544527214, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.1778611321, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0739443014, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3084556368, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1462174256, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3347750166, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.160818779, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3641324834, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2551350395, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5313546359, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1378820316, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3107655646, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1709984622, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1504584503, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3596796797, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1505540762, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2925093305, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1634286453, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3969874269, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1941893922, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3901489833, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0483040779, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2397015969, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2065392724, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3737641014, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1930726574, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3601509235, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1945423193, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4706222269, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2080824448, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4427653694, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0968739317, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3579218621, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1111961001, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3079247504, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1321058296, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4148432475, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1334077034, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.353859986, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1276840555, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2760466632, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0780295493, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2439534508, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0869662189, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1961381404, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1053768783, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3233296515, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1575728667, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.380676919, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0544138319, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2401823262, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.142698681, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3178612043, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2040655697, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.376089573, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1296171694, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3033295225, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2384341858, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4082320856, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2697022372, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5172978598, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2372622546, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4900486445, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1901403577, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2680281173, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4784291862, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4945887662, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6179893618, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3063009808, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5439056051, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3059872017, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.549945787, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2007634744, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4962551545, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3501359482, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6055612825, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4152031383, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6485212541, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1985084237, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4358434184, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2841613094, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5096201523, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1134451991, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4186167763, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1725115511, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3315849141, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3723330253, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5112697991, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2017033512, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3541251998, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2017033512, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3885781004, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1913937806, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4390566098, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3530697921, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3857901148, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4926358895, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1050810664, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3182774829, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1214053826, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.301883424, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1942053406, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3642322841, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0982997996, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2894553916, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.16885023, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3897135624, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2309552735, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4397565698, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2188392829, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4140411856, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1427059628, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2812419411, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.306043488, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5282587184, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3325026294, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4580563104, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2353003372, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.462086073, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2936164862, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2051247604, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4188771621, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2835933397, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4681874025, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4824794738, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6479459161, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3728402746, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5528347505, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2699951685, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4828357047, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3745868968, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5282052117, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3943334862, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5908849928, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4656455051, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5477103601, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2887308473, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3884617412, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1349784947, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2945184645, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0920736585, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2745662608, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1572597084, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3365623219, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.485644095, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.592399345, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1548729353, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3929349486, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2746536545, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5102501784, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1815433909, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.391346969, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3014400188, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5581447528, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3150760289, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4551575102, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2174185304, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3535910166, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2217113122, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3447082087, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2006070365, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3557846262, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2673037873, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.648590256, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.7627201392, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3362681996, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5466581859, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.4947540499, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6678485037, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1375371447, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4743993715, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3543589929, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5568265126, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3871334683, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5376493568, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3200033164, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5480591856, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2092643342, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4046472013, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.1575821848, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2152072672, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4179680482, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2478022358, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.491240125, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2113263008, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4175670766, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2255468433, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4891635966, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1370370496, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2292375927, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4025389388, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.5543498698, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.7016802878, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1310836926, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3929302742, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3648490408, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5682825804, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1799729111, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.417212745, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2543023714, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4790404367, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1320382335, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2828076723, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2017404545, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3372929884, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1667112121, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3259291853, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1575675177, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3206700573, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1620103883, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3071134953, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3742031646, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6481907872, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1087866109, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4101850467, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1463698595, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.42477479, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1349098379, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3721166388, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3453936507, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3236570703, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4584149295, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1389436247, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3571046188, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.137636667, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3516386852, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2411398276, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1548763492, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3683148867, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2663716042, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4646735366, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1958506347, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.372592422, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2019101909, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3773476048, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1548763492, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4072395634, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0989549941, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2820930896, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4174908454, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5512835123, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2661644793, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4654663366, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2120354775, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4561052893, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0864423735, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3200397806, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2816688976, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4757360013, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3924547709, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5302932216, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1717115978, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4250539223, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.171852621, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3551447462, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1859746857, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3585545206, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1894523533, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.424355484, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2989691017, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4142365762, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1524830877, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2035768143, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1469126404, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3211565002, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5113942347, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4747560411, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6309823583, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2685172542, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.538503888, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2528466674, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4890665991, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2120879887, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4413963062, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3453586867, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6504104767, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1283205561, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.194339444, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.144821893, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2913876816, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1217802107, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1931459873, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0223039199, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.267848848, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4282793862, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1441067013, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2402520759, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.163069571, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1421938964, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.355094502, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0135019379, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1383930915, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3524547207, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.9199349283, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.9199349283, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.8827916928, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.9278293769, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.5919743411, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.8142101617, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2743406515, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4551761514, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2811228385, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2624404628, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2044894276, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2893773733, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5046355815, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1146038414, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3230886173, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1308613527, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3063146287, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1508271374, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3293232641, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1327211341, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3314509193, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2380622727, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4340156073, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2297430099, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3576672154, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1278739555, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2193151599, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1206624176, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2754556887, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0192832489, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1077448901, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2476800411, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1812045837, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1864970369, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1441966459, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1016310669, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1449839903, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0118394259, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1828304652, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.261122481, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.142888152, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1495731661, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.15892175, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1223899131, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1802916852, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2500534855, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2695829028, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3771988117, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2767504847, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3780460244, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1891598354, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3233732862, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0223039199, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2511187198, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4502536325, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2758862938, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4673996585, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1250361463, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2062406434, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1453997173, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3142480613, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0135019379, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3007733426, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4585623736, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2823442299, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.404086042, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3368893372, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2247529338, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4113282939, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.0258690763, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2249502221, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4140027812, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1781853859, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3686572709, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2961559728, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1087256679, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2806568392, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.111714465, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2956379412, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1241635065, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2326512001, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1284649702, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2670865603, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1283783991, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2740743526, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.0194337786, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2707832297, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3606120885, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1877226619, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4516796575, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2825237412, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3549531183, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1120375434, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2450093988, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.028862055, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3147237573, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.49783234, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1053163639, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.1577504735, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.261284893, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1369397402, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2484821087, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.196790904, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1607929865, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.259319196, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1789898551, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3097165911, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2126837066, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1137814278, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.223407913, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1529285663, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2723711009, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3950616414, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1574230264, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3220278551, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1888979635, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.390828019, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1484131243, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2920414182, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0195101085, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1616505795, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4196724713, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1485542687, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4089031318, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1736086198, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3517982963, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3493211336, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1911889636, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3809795532, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3506998338, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3460456809, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.462108393, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.25751651, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4024993164, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2235704325, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2077198005, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4256662982, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2873180114, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3691291665, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2163684008, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1900122523, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1590212887, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.27967228, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1858282605, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2793116461, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1362877036, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.1960450701, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2488272373, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.0141116602, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1127695881, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2856161525, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1087256679, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1812150267, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0962409008, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0819661291, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0854674391, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0096280076, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1803546808, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0820617475, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2460006523, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2894206731, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1306975702, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3655209094, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2836415884, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2821274247, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1732999022, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5837818483, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3373556859, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.673878917, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4059531821, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7392702727, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4658089028, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7584810979, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3654687885, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6925292675, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.444673026, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7559084687, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4347813218, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7018196084, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3877278798, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6833268597, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3752981126, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6378039241, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4348285114, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6920474811, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.280389371, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.503849475, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2571849599, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4369258128, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3035527426, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4761172766, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0037622272, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3457321731, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5434124381, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2989825849, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5979372542, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2183240532, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5385996669, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3115768268, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5357057702, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2586945044, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5387430999, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2933957201, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5936892247, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2607899218, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4870249896, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.191121255, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.39870105, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1905322718, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3856189129, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.248309228, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4179013561, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1471509436, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4120014457, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.161587186, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.529420843, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1181515336, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4449148299, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1643968721, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5023375866, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0665116326, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4270729969, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2366816362, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5999794442, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4280674425, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6762864075, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3476608426, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.626295616, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4264340684, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6927790189, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4484733265, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7011327082, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4284560652, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6829784892, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3151326247, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6088063321, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.328480037, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5845846161, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3725587542, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5802452419, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3178390602, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5668993446, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3193473734, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5461880374, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3357114889, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5776277216, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1659171786, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4778817765, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1589577308, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5058962769, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1647744547, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4598199643, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3834925244, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6550089442, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2715808911, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5912854464, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3561131938, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6360822052, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3253181782, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6040157598, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2867189645, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5412439326, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3716909306, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6400806371, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3000602447, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3256826625, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.200222167, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2547579645, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1250604585, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1308907403, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.300747771, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3173961463, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3328662057, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3421549061, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2013896165, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.315443766, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1801035326, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2514369893, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1111050348, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2281901709, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0059808612, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2260510897, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2500902724, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3575554083, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6357905859, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3834139647, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6437362314, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3554972581, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6081126361, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3772896178, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6184118091, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3438759684, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.620308087, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3212586103, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.620034408, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2954260352, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6045890208, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2334956542, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5824998908, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2520855788, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6062602862, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3841455225, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6295439096, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.260458933, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4556002625, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2576953652, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4479264653, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3051867938, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4981245027, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2079098647, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4381081083, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3840172214, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5461608433, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3320200379, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6008057921, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.5169325988, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.7139612819, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4906167178, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6748518136, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4470391996, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.665558212, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4492908061, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6890808549, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.484685137, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6277597963, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3004426157, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.507295912, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.350814921, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5412873656, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5060360517, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6405988584, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.6276032282, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.7074650729, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1016723331, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3890033984, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3452100271, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3365774376, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1121249014, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3581016714, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.153076948, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3899957108, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3118864894, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6025015601, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.413605391, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6322647536, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3273823162, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5178441995, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3323940789, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5517145772, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3852134275, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6429066044, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2636126115, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5725817956, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1678792928, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5011442125, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.026624515, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1073690646, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2421311685, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4880061745, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3463282124, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5555330144, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3192431461, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.564358704, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.464654367, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6187472057, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3106871546, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.548144012, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3812607926, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5800153449, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4214243411, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.60223322, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1422280571, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4996646755, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1986723298, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.47211934, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1786760469, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4403373046, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1106951975, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.410884295, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.188618651, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5044545567, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3006555, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5078021901, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2861877594, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4976123332, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2709988793, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4973599115, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2269082918, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4124766057, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3564226671, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5759796085, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4571863894, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6765316874, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2842437601, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6165541832, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2790392444, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6162878623, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1969296745, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5972281991, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3108511414, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6249458527, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6260866791, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7122695616, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3856140451, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5942230347, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4780935793, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6515239203, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4501074091, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6258219369, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4729242406, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6516452342, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0251270888, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2103198089, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1472126053, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2721389124, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3131582236, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3759662761, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1677740288, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2760884587, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2504706648, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3683837339, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.233330942, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.49932033, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1115981822, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4729286927, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0704301723, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4191306757, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1701187421, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4260320225, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.115898398, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4642618457, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4060492501, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5683580956, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2440631576, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4895502948, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1850667576, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3318090489, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1087869093, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2847045761, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3388231819, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5047311452, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0764069043, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4641021856, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1630562636, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.493101771, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1006070178, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4914538834, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1212389814, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.49565292, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.198935439, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5787262396, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4264281996, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5686715594, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3755133068, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5350958966, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3604013045, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5240948376, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4238002737, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5825787223, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3589634609, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5234247996, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.4877316024, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6806798636, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3052856554, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5318320484, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.4256487928, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5834916199, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2816107594, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.477082609, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2595156374, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5213735061, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.0905633892, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3583129188, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5383434353, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2130989207, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4807665621, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.275156839, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5062735872, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1387856811, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.369259047, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7332676622, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2270143682, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6596565789, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2175041217, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6503148633, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1255606329, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5394589085, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3365506763, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7035699247, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1884239372, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2423459309, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1403347529, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2185459073, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1544051366, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2009434646, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1994738801, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2058451682, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2147557194, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2333215266, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1908993043, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.259628071, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2262772028, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2839086021, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2533922732, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2943322309, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2040769216, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2928742362, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2478061172, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4713415477, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2207122704, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.456253588, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1857249984, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4463428333, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.160459621, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3992610986, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2169620287, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4507268789, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3705172113, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.649810457, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2580007064, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5822544211, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1726118391, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5023852141, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2359703193, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5552647087, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2629904893, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6085636416, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1036182363, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.431058131, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2230178035, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5101738086, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2022608472, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4830960721, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2937928217, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5533712219, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.4348610152, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.6160254004, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3679493367, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5158310723, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1150400387, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3409890284, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1441776939, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3580744505, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0817671554, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3376841808, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2774818103, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4411307983, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4055164993, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5930648847, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2639360931, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5375555616, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3303117726, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5601682753, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1750331258, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4313311083, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4390048534, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6549871625, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1792900088, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4496535427, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1623601433, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4898951518, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1573584287, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4685781724, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1886209475, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4517676089, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0920251528, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4638593627, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1250729424, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4138228239, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0966208016, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4004063787, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1258253277, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4333298888, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1010151447, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.343349718, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3449932176, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3193029809, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1884342388, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4066192083, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1908128615, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3911351097, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2012073364, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4077641023, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0823759385, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3921113359, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2859964336, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5040359554, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3129064463, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4818397472, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2929916735, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4808831615, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3120625544, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4961726332, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3648098913, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5125064136, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.195985918, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.482541346, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0949057459, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3865255231, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0586605592, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.377197891, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0679939505, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4163550142, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2240898503, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.54154916, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3033134628, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4755698162, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0127704703, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1075718894, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2361892255, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3941806818, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0858944935, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.276064987, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2090466302, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3818993802, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3999768728, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5906362816, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.52088337, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6368157604, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.524831709, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6599904809, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3727105528, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5475770179, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4788542814, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5906564992, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1743988338, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4684683281, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3335763232, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4822714438, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2462820359, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4749074723, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2865635502, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4320753872, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3737090686, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5762937358, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3048576564, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4770499606, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3346942052, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4080244616, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4747315562, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5626366883, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1308491772, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.5354938906, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6350822218, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2490362691, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4211642021, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4691649771, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6210364771, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3534673786, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4641989602, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.056547436, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1884054524, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4929713219, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6254707348, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1736104767, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.393775893, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.126460717, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3539946558, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1276008309, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3476941267, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1006991959, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1745141145, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1884527988, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4226648432, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.5294442647, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7281375073, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.9336510696, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.958650753, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.9336510696, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.958650753, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6337520241, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7734740774, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.7096224668, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8862932371, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4947542579, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5906548178, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5099580113, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6038542863, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6369088067, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7248557877, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5948162434, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6684517153, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4356351975, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5621273473, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2945813788, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5492390632, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1546384187, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3842787636, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2366578533, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3856245148, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.328502066, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2359066675, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4765138747, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3067124926, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4473439946, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2822493398, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4650791383, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4190273601, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6029944828, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.173672033, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3714461699, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2129735961, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4468251761, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2753456537, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4157637471, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3360301095, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.501569143, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3264610954, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4838177775, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2761209759, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4424892418, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3981901965, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5022380875, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1138894687, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2353205597, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0804938628, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.217350608, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2956525254, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1041367752, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1252616458, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2842745976, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2388293565, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3198037877, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3223153471, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3862935529, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2406079909, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3958883558, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1218838983, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2078806325, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3136877001, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2318330748, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4860771999, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2913081396, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4751771262, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3469521957, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.525360847, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2250790396, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4530321846, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2968580869, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5231126813, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3593341086, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4858623213, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2697896652, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3998510332, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.243735105, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3861458, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.286697952, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4328892686, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3354179041, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4707359469, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1300236097, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3252515328, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2943194787, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4483746666, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2125494232, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4269647769, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1841823461, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3926618248, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3128940106, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5097722113, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1015499098, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3241234761, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.079112239, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3284566287, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3191396327, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0962868698, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.195215486, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1913038578, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3835123675, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2875779878, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4020991165, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3288944381, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4440807082, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4114907933, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5085164165, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2002896041, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3388229413, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.360086008, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4853098817, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2899749804, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4921335323, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1409707879, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4079828299, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1314184908, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3328394281, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.1529586444, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2500778673, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4549489332, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2310235481, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4512153003, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2408004587, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0809718104, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.305359525, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2889508584, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.122781136, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2856968511, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1387209969, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3380551337, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1352931404, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2234340618, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1840332408, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.317973804, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1620137044, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1330402086, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2717234469, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3079971615, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4820111162, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2869584903, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4998009182, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2346948461, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4172389095, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3192819492, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4961701104, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2557514081, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4498199144, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3264083013, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4603285066, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.259343251, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4745626718, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2016006518, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5098889524, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2398195555, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4808731682, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3308717914, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5800788401, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.083279168, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2503889973, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2036833814, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3653296593, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1810871976, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3325373478, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1542033805, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.4139653948, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5525295779, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4763100915, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6668706098, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3312076918, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5907489769, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5419642317, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8375813242, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4506908225, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.63996736, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3044867545, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5152255321, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2021780304, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4743589083, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.904853094, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.9226314544, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4267826722, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5025756331, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1471005213, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2322531742, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1942744651, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2821379317, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3079393721, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3927110552, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1928576546, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.270808948, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1587572218, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3353137004, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.886247642, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.9357668561, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.5181212746, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6637469241, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.7608566263, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.9001274946, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3019157873, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4698220749, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4399331705, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5265527952, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3419094567, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3847189235, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4012265866, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5789876781, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4005128871, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5795148403, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4012265866, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5934450566, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4499781507, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.525580448, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.280395012, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4511058291, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2818720424, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3950106268, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2843329182, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4886785606, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1665240823, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4246320308, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3013982925, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4053314221, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6060585354, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3264348007, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4480048056, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3259481889, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4476144545, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4064626339, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5788471954, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2693965184, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4991283953, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.36210097, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5007651303, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3875738939, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6165609648, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1950050755, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4506131026, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3563054845, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4957192174, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2482606597, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4805206362, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1252209667, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1209593074, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1142206843, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1272693266, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3016275716, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3187271473, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5308594427, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2015807475, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4601245932, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2195152443, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5863542368, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3187271473, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5195515317, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2641917897, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0318358959, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0303845602, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0523062047, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0682355626, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0846491228, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2847994216, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3268532843, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1644290227, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2560785882, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0959478503, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1059959233, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1450038761, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3981163195, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4004997066, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1371497117, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4028673945, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1420515519, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4282852879, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1420515519, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4282852879, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.319417405, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4712019524, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.255518483, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4454321915, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2425888287, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5303410271, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2524885334, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.478828996, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4778863492, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3299895473, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.498417906, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3152861344, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.49782107, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.0864442659, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3191159906, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5859514293, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.5894330056, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.7233859304, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1750913104, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.297354245, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1663850537, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4350932502, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2291100391, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4752055978, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3842217689, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5778946518, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4239615629, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5537191421, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4392283616, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5797315908, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4247462711, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5232906543, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1075287508, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3325883825, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2058307936, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2107657819, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2130422727, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1462550512, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.6870287466, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.7656691937, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5948821108, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.7754376703, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.674043327, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.8187596, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.4887049965, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5696145524, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.7248600508, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.7668237606, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4028304605, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6078521036, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5838997128, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6318158012, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.572193392, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.7452043729, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4343409883, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5541452606, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3097893907, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4783527071, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3875738939, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4061202407, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.4478039778, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4520078854, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.5013053504, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5258745855, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.4331017717, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4713714415, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2033075084, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3604872182, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1466968641, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4859054131, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2034208182, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5749290926, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2034208182, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5749290926, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2034208182, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5749290926, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1930040421, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5580822624, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1939469894, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2682569699, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1866149123, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2813929671, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1883009511, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2661819569, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0435779151, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2047856964, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3218527897, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0978416821, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2989494547, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1333681278, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1445394036, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2337549905, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.4978067743, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5375886122, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5703017173, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7850913637, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5226605905, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5272140519, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.469268501, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5107231091, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7257353761, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3200158957, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5274343389, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3186919152, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5973293883, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3128418715, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5961262622, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3022215252, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5926217013, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2893311641, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5515215768, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.6666467303, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6471929786, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2328789695, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3483528858, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2328789695, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3456033257, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.200389085, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3836585468, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3664818394, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1404678995, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4700598489, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4348498215, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4348498215, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4289684146, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1475256904, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4128304713, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.309770793, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.449153775, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4088404018, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3026286473, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4888814491, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3572266803, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3597127268, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3074223162, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3309181567, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1627690506, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4116725746, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2538149474, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6023865926, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2082883818, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.391912772, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5056837352, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2180019396, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3968860255, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3787865613, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7119470941, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3022215252, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4946479234, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1423901521, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3901105746, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.393621915, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5349231274, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1361769926, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3723385637, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3191354334, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4641046312, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3795275164, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5401652762, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4063299619, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5674287432, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4216383985, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5776987777, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3205353201, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.436221067, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3598105145, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5180775172, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2878333694, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5587364816, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2878333694, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5587364816, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1636332971, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4085613623, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1408710585, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4105428764, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2903680252, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5539971387, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4718372009, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.5143710449, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2167183006, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2271978215, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3541296817, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4347460768, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1829565422, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2454264181, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2920066582, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3605231024, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3813114672, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.396813506, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.457015118, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4585873078, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.018115942, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.6061105882, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.6319310382, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3841997816, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7084389853, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3212854968, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5882101692, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3212854968, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5888103425, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1767874865, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.501117963, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4853620478, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7648536899, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4617549487, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2460137258, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4970122504, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2222984955, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5180400951, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4768696921, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1440238603, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4789487224, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0997061711, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4157699696, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2567840481, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4451755318, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2553868974, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1933452462, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.293791183, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5236831459, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3102922353, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4915321839, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2574866102, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5470575133, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.5006114305, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.7491334026, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2241905682, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5391137757, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1764052032, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.473410834, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.376523994, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4294400247, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2833048493, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4307098267, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2833048493, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4307098267, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2833048493, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4307098267, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3855945568, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.442526126, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3497346619, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.543713166, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2134933297, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4394062814, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2243788763, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4280898947, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2590626038, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4529830758, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3307716989, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.6040822482, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2516546237, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4948297816, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2862280733, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3769292787, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1800282927, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.403106949, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3196106623, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5296986869, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2617850445, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4734548341, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1859237021, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4365745598, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5931895311, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2876125228, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4827207643, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.115087118, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4108808712, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3362604354, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.538764562, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2560635442, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4885655705, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2560635442, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4885655705, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2557785047, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4889726939, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2560635442, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4780977367, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4257336921, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3856475022, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3311338569, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3817945701, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3475331505, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6686626267, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3538049407, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5074236666, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.335386219, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1471049942, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3568052877, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2531894608, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1586578315, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.33433809, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6158161555, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8568982836, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6535194995, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8909391457, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6535194995, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8909391457, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8151678596, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8873630456, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8571061117, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.9060265113, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8151678596, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8873630456, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5386933265, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6707532211, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5852187597, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7147018027, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3168482272, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4984008176, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3168482272, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4177993106, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3168482272, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4715336632, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0183433739, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5450474312, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2559035608, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4786634069, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4146932034, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2371332025, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4712410964, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3762184184, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2462292439, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4831201029, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3351401412, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3832378602, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1635655188, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4304115185, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2833653799, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1749329866, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4597805061, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.5709867733, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8984616833, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.5009303658, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.715138778, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6721494117, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8222964288, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.4359493825, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7459582756, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.4720758039, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8498299926, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5294365116, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4115919884, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.408214313, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.510906315, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4572935209, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.4733115267, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.8148863882, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2035245828, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6347163228, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.377384826, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.7950074174, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1452964737, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6260669205, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2411108351, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6937177459, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3449754051, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5521970778, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2030408603, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4269249475, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2030408603, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4269249475, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3112389764, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2175445226, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4621999155, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1342195244, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1672261436, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2147000595, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3190887215, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2723297594, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2618225776, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.315404285, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2210933301, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1650999034, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3758546473, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.36761798, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0283502344, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3231493409, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3101339436, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5526778778, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7267402732, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4779289657, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6131584717, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5034231828, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.718579705, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5034231828, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7006437933, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.368528912, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.583972703, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4721001028, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7096678127, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4336560555, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.8096970872, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.7016116563, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.9349183533, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.6298777848, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.878403256, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5642137945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.8202028423, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1307201098, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3105434451, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1196775895, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2800855103, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1641721567, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3694792885, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.127438001, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2780344257, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2935328201, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4343450424, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3745324928, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1347176685, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5276176357, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1587572218, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5368911831, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1381779039, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5050266838, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1356697961, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4650537985, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.319952675, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4662509731, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4343790315, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2970991782, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6304107643, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1452762028, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3233041458, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3744741718, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6453688418, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4012179884, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1751062735, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4866409707, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1751062735, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4866409707, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1472462377, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4296561365, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.4035471681, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5496664963, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4111336169, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6541511334, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3911104257, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.7162899586, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3044269773, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5765179984, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1777011474, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5263352658, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4447630178, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5830457052, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1356697961, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3869963101, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1434533437, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4325933877, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3182117086, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4064888217, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2180019396, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4699679053, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3070257186, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.527093728, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2861555645, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4630699599, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2291421308, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4574939601, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2850782271, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4891358901, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3208090524, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2520126751, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4174826402, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2898497052, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4696277526, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.4010889715, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5073411865, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1942823117, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.451675729, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2250265948, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4199494351, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3693809258, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.513005525, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1611121224, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5162765195, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2310953637, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5693079918, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5052082359, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1799107865, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5159811845, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3550420051, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5693079918, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4252891538, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6269243846, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4983116255, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6906494695, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7887116805, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.7490853969, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.7869453805, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4970449067, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5549084693, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4713668887, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5328387001, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.6158362063, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6672191436, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4646317993, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6658302112, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3093406614, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4556857835, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2982935803, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6025685351, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4546828805, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5363479232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3917244018, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.634289822, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3237596834, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4184987692, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2658380217, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5022872142, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2928787573, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4637938557, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.5728145662, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.7040427612, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.6169034543, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6942951271, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3357306484, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6896084088, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3294509143, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5502318838, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2589451141, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5228701285, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.4784380961, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6639502808, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3975205618, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7019684122, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6102624547, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7455382911, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5129914365, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.67190581, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5129914365, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.67190581, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5119999466, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6745099803, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4949431899, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6525478644, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.18558816, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5082547077, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2510461568, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5386684377, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2359267733, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4722703389, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2287219601, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4750367449, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1423901521, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5183430109, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4158130625, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5675993368, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.0342345368, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3041065177, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5406223711, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1602072099, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4494779998, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1573693792, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4141688451, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3910803275, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6466158388, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4464617303, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.671951878, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2291421308, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5523264448, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.5718458251, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7377760377, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2291421308, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5523264448, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3964023717, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3718976854, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3063889665, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3060606493, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4392283616, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4449696053, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4226235346, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3911861221, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2560951677, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2815384743, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2130595648, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4395285387, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5439405004, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2348836444, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3379049313, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0421351537, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2348836444, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3379049313, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4093184131, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6844082267, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4093184131, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6844082267, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4093184131, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6844082267, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3902273664, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6827449888, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4696150969, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2265672091, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6312451922, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1899243506, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.500884399, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5116579034, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2153539712, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5925940105, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2882258334, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4424981884, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2882258334, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4424981884, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2882258334, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4424981884, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2882258334, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4458584062, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1697362853, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3381210713, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2128170138, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5028404617, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1529555934, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5217846955, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2003652983, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4411095117, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2380400381, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5256271785, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3957831378, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4323312774, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5997371746, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.49935842, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.7295897847, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.6510651028, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.7734123057, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3606966647, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.571396397, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4622787126, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6461151023, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1637368249, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5249159229, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2966347936, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5048860636, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3790331198, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5564797446, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3785063589, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5506535618, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2179883013, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4809891449, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4784684191, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.522074413, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4546747838, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2392702602, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4504639375, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5107881984, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.438460371, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5878523089, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3049156496, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4120879324, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3635609139, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5425942882, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3727355698, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.536698185, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.435040381, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6606468296, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3265516874, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5955775051, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2392702602, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4508373082, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.7071067812, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8568176228, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.7071067812, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8568176228, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2660812518, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4802266387, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.296609032, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4660692266, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1824016291, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4735258457, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2872797668, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4999892148, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2872797668, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5378134889, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1969653399, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3627040803, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4425219454, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3847693175, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3547910527, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.616414738, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2989467365, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6322815923, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1833025609, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.532839114, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3478966138, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6662710525, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2169730141, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4876777358, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2907703617, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6671226464, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.7416488037, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.9156308979, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2924496936, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6040522124, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3561185946, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6591871482, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3092067389, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6104451102, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5430702341, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7506439741, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2311930167, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3547822876, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2041933345, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3947029725, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1459922303, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.287186852, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0680779228, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.294610633, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4117700236, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2623060932, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5822825438, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3131514736, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5852253917, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3030832087, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5712741348, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3196102365, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6246652359, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0332883722, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0222790845, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2255166571, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5279805413, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1565711241, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5086519721, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1258220556, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4723958268, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.141359839, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4830716883, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0351981682, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0159737507, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.089055915, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.392589918, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1683929873, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.381545505, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2248128566, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3861073517, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0729263925, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3325364977, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1774329946, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4899555753, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3414076547, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6319466141, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2259250193, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4846944834, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2928926658, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5528145632, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0986132217, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3428977475, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3331101711, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6152393361, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2457249203, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5262167453, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1809849704, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.518347761, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1946439942, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5198306336, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1984776125, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4798124824, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0359956052, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.0165678101, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1154324643, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3867652323, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1752510532, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1096600595, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1626044146, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3719686647, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2574866102, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5192222794, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4165851519, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.562626404, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3279697678, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5237407368, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2007935232, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5138627524, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4470201256, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5730388207, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.20624077, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1636538054, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.270306405, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.253393528, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3563911216, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2046918777, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2562732501, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2905178492, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4540869803, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4416037594, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5926552553, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4183954029, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4906994718, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0140731002, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1919522337, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.5821113313, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.6682049424, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5441799558, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7471708187, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2737674172, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4929468277, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4413715884, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6477253957, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2900657692, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5959886772, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5465033075, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7499074935, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3609260083, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.649671408, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2322365387, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6044384701, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3064251318, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6182391877, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.165115706, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5582712048, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2264993238, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6026783584, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2160530266, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5282568801, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2645853844, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5387766933, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1332400927, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4393875304, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0836079515, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3542995435, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1963524852, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.489147064, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0722880074, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3524948213, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3972317449, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4096483878, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3316829223, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0041614648, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3972301057, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5673240078, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2769159339, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3972548978, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4314404724, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5867820726, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3337026924, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4403514507, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4913452072, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6018727488, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.375663721, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5970100838, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3798945671, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5769558961, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.233244271, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4221129349, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3115230561, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5400649416, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.0190652043, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5136268736, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.7472505674, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5269786262, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.7211839704, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4470417555, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6464230283, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4571832355, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6782668461, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0042900043, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1847300022, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4760100031, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1823933644, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.502934539, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.113792739, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4217370585, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0948679392, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4061568567, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2287860382, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5140335092, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2488783136, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5200881907, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2413534424, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5466517514, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2240750868, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5045920246, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1959905436, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4875379508, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2297794059, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5735702228, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1129096545, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4125077608, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0922510128, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3735011261, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0469373201, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1189826308, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3841920009, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1382412077, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4421654273, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0896188909, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3874168292, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0810085962, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2445184945, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2601769109, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4554928797, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3216969757, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.4664391558, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.605420338, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2559186141, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4431886252, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3528573301, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5945202859, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3494033885, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2506708133, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5592183665, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2553582779, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6051855679, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2809009542, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5819888907, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4573889291, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6974989992, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5409314027, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.802347513, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1137202771, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4398081737, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3615855225, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5942403749, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3487575222, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1582438233, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.284703464, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1307655888, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2688265705, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0107154608, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2557741235, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2791475974, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3778334877, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3375832969, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4156592382, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2791475974, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3453692248, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2126360951, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2685899742, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1912482271, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2829340635, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1196671345, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4250373762, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2805776239, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3746450748, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2759077539, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3308083901, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2551158426, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4338792723, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.154267657, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3640443241, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2869066874, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5218678198, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1661865517, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.45189521, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2483533682, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.505707709, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2885952308, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5243060036, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.425874468, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6780779329, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3964513253, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5953388302, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1815358071, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3893561044, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4884391792, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6793073122, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2362618716, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.525917235, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.140651088, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4653016103, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4188525448, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.125176864, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3906486876, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1184766267, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4766412062, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3637736732, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2840158072, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3050918119, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2674112241, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2680069355, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3112345209, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.475667469, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1850611533, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.509686347, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2662692826, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4932548717, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2579969134, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1491932244, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4210541594, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1651065386, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1451461303, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1479818938, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1384230932, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1025254667, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.10386785, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0744575239, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1808124012, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2406197932, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3480566207, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.300208614, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4112215755, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0320626478, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2188350648, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.190893953, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.47754616, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1876296055, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5059052803, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1984324635, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5254585376, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1135808594, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3797631542, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1876296055, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.493482307, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3108708432, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4849340358, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2843877928, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.528750768, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3758626428, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5683038109, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1241259939, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3894435624, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3375930269, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4797696969, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3724134618, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5411724479, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1099151473, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3588978856, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1348135718, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4147071076, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2941203504, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1923965056, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4584215933, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3022989529, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3201383637, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2896934245, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.283806646, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3237479047, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2881907225, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4281025086, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1722187017, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4101544501, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.150072255, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3392953951, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1958720486, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3104671472, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2461253685, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3990423816, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3164318652, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4990369741, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0972760643, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.342689178, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2285174116, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3905236065, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.11560301, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.295690976, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.087496553, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3126423888, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.291600602, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4185967939, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1645740483, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3333343855, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2673465335, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4408611095, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1398001346, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2819303243, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0775275442, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2751344778, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2061429004, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4026346891, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1045812512, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3641239192, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3208902702, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3438619395, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2249513016, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3898866357, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4419177841, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6137680308, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2556795749, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3876058827, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2764393753, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4260558157, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.359338145, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5180379308, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2676032276, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4724604739, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3914713795, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5396649879, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3049871822, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5208588286, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2865475627, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4454875632, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1539576975, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2834099675, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3203990808, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5773010308, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2896941452, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4170954365, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2025417934, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2105213575, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1554525645, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1686298661, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4974216936, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.30894994, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6495798577, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3580649764, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5522671396, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3391824705, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5823536572, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3369582032, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6048568842, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2164879231, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5842434739, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2532589714, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.511461689, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3730973285, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.592642294, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2147809314, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.532218679, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2720498476, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5456825635, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.266753372, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5290480371, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.9199349283, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.9199349283, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.8827916928, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.9278293769, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.5919743411, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.8142101617, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.16249656, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.476936782, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2112648086, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4132516612, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2265427297, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4258225502, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.388768348, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5513827117, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1604234263, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.468730386, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2044743997, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5296253104, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.09990096, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4354158807, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1401169793, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4782044537, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0880759031, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3086025862, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3472562427, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1689554749, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4875202059, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0986302237, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4410680148, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1059024181, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4187169529, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1111789549, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4609024218, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1187170429, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4586403617, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1615782196, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5255622544, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1574843076, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5300202362, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1508931842, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4742831787, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1439177735, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4521011409, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1488860631, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4972935075, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.144734792, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4413634591, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1842259593, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4512010919, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2686541302, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4813075023, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1491263856, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.39836399, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2074208662, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4987857684, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4566114003, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2124502622, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5450614695, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2353412578, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5178557103, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1731210051, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5402176694, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4665729244, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5049599536, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4643058745, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.514192187, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.193632685, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5704206116, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5154606393, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2446802689, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2749771764, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2439938766, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3044305895, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2005610751, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2780404942, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2694630167, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.291849524, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1651529608, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2497776365, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2123763979, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2071915239, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0170096895, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.162615831, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2819800493, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2849456986, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5314415166, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2326954497, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4974997792, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3076407164, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6086887537, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2719751267, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5796304581, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2560035505, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5191300553, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.378025382, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6691463628, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2764824154, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6690579621, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3202552755, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6434556886, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2560315227, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.58147541, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2897057417, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7234741869, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2991476612, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3082702688, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3198590175, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3093019888, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.381228465, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1259590106, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4578429795, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3002210626, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1083616403, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2822470724, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3083734365, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1628565646, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3859336137, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2686036309, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4679627865, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3211488647, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.429013072, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3174558825, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4724792895, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1960240721, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3632643494, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3128281918, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4675168561, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3021887989, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4541987874, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2355248404, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4709821983, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2734403418, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4592757627, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2452145963, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3983800926, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3847470794, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5248793759, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.260126021, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5371799695, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1413737596, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4881276326, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2524400151, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5432183114, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1680217412, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4767498069, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2198650169, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5475496672, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0515667467, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3669821824, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3430290995, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2103962198, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3552217342, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2984253657, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0995249808, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3978595246, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1091680807, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4367149526, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1068190066, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4311441166, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3941055693, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0901595152, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.411812523, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3845967285, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4131845454, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.309372316, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3100065568, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4784779258, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1407383559, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3186851469, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1109252864, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.316043836, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3032188091, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0764769558, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2986901903, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2061578366, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3710107839, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-4-maverick", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3.1-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"meta-llama\/llama-3-70b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5068360865, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6984477546, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5679608238, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7468819234, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3393107079, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5427607577, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3310002393, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5283894636, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3472596784, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5880210095, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4960282462, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6821172236, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2511517945, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4484633445, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5767974034, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7416604156, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5749603738, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7240488252, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.561756135, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7132694857, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.6303545031, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7778513476, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5812269907, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7632349489, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3604302814, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5648482392, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1531771948, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3880097649, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.6001453933, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7620293912, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1968599621, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4529546785, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3067694293, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4968492831, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3671596072, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5953389856, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3671596072, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5953389856, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2516114674, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5164808837, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3276399373, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5131503736, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2334365819, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5188968707, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3954414304, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5959322291, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2596939072, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4394574387, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4273817965, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6016204187, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3972267644, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5952617864, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3930690372, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6043335353, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.323749564, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5552439191, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2777551013, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4942324012, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.8562379115, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9148801473, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.708662669, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8167266342, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6537803976, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7742226744, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9577952806, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.984767538, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.7382380644, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.863773877, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2755180391, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4551354637, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4226799078, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.565167271, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2059670265, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4308095886, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2057575468, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4318610933, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2502214193, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4981965725, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2892582108, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5172170139, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1953965032, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4370535626, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4980275706, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6323394518, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4101914564, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.555006366, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4414649462, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6003092614, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3232734747, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5256417655, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4338913034, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6021209112, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2833191488, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4778413512, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1357635818, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4152919353, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2492633192, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.459975643, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3688167255, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5626506838, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5077888484, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6493197366, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.393556643, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5739224928, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4113107631, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6024368114, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3882758257, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5946895227, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4225533488, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5840904424, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2417736009, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4699968298, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5946872254, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7456034599, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3681981336, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5359192372, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4784060474, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6297473901, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5009380664, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6679481474, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4535479195, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6276625295, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3882789068, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.562561181, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2087397502, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3941006947, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4640742082, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.637268019, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.30290763, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5118703718, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3732667151, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5674650482, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2729277173, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5212657903, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2736066918, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5141172587, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2426576142, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4681164294, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3464618222, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5286087759, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.133372824, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4379609517, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4623862098, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6294498585, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3186774372, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5594486932, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3725907669, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5838909338, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4641858541, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6257813924, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4305805253, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5975873582, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0006956038, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.213466604, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4749873824, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3284656617, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5314089061, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3146876332, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.513230779, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3576035471, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5426399703, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2491599346, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4396481537, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2419210808, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4175394769, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2840596414, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4892722276, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2867782978, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5017473466, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2534929996, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5066198264, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3968190443, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5978315904, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3231223154, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5181020767, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3443388178, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5355920179, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2871697938, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5171262479, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2871697938, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5143386556, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2597056289, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.473469114, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0544811282, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3360010227, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5216531074, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4116786322, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5837404006, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3321094491, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5289420578, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2303710197, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4814028637, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.239223165, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4470522397, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3909683537, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5861999156, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.406520103, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5957668555, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0019825535, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4692988665, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6232055063, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3891456077, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5725189584, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4100880948, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5748650911, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5534146254, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.707494003, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5215309395, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6680522998, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3018199728, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4978437519, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.192504126, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4448372401, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3109333641, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5072760587, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3885745413, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5684937371, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4475435253, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5956867227, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2634713516, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4853029313, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2719748745, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4991260833, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3510316028, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5432217849, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3940944668, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5436661646, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1840510532, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4424977424, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5815914781, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7321831384, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4451909306, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5879542667, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4831574055, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6238976884, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.366795109, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5743827294, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4069863198, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5748668902, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3292629394, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5443707655, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0895824672, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2467971299, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3511508048, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5023642198, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3911696105, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6565815108, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4166560818, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6515522499, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4275922258, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6292567445, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4049392463, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6196675475, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4469713873, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6533822343, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4699943435, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7050475306, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3672054108, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5562995581, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4576126417, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6880668163, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4800491211, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7058154381, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.5803563388, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7397216312, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4549567978, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6997352224, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4549567978, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6997352224, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4396453172, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6386415227, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0025767495, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.022849656, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4917930708, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6798382116, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3359905246, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5506683358, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3722464459, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5716341953, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3914166892, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5926049532, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3648850355, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.572324348, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2820342917, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5410881357, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4159534389, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6228483474, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3647006104, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5752487475, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.5444545011, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6995635477, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4475167124, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6011479674, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4611551555, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6294324147, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4186536317, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6246787833, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4510663025, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6439430694, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2827898584, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5364084167, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1847406257, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3944315617, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4044350003, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5937440273, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3497458686, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5486997386, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3660623362, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5840165125, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2667148789, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.51861541, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2667148789, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.51861541, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3495696951, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5497542561, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1750935993, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0887521832, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3759098347, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5116576339, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6761326472, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.404235506, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.556784461, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4342485684, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.586275655, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.328462603, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.523468747, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3709295124, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5443097614, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3415769856, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5550034046, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0626814221, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2649283376, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3504606692, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.569698214, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4110978145, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5909828034, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5005164973, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7019407549, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3422590337, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5784088566, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3638250719, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5597199179, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4389167618, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6283965584, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4783304729, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6570361508, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3179196449, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5391165578, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.480524006, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6678968008, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4870178701, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6571420749, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4544549778, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6588011478, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4720654627, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6517469394, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5253138253, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7137080321, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3621629593, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5817525999, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.130814435, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.417733523, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5333753443, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6915993703, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4649415353, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6614464392, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4824471895, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6756807439, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4291308582, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6230860316, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.429066773, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6259670174, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.473473697, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6817862357, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.533503574, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.704064939, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3655292172, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5818586474, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5963279753, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7384834127, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5416689002, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7032606089, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.504355087, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6689462373, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4628513443, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6651586362, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5244317205, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7076771206, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4884034257, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6801218411, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0049537649, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4857812061, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6418878687, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1997940806, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4450142051, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2336337525, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.453927541, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3008193499, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5592925653, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2871484146, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5435042612, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2405899516, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4522509934, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2755251639, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4769491783, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.226375858, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4191052212, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4278755949, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.604902493, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1898809558, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4182314372, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3477722544, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5603739447, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2488577037, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.470061206, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2858464947, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5073688692, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1926947735, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4068420923, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.1024690102, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2638043203, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4634992427, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1787758424, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4015188769, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3051960192, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4844089738, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1095771553, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3392444985, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1096488255, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.335638916, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.223471946, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4665650708, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3016964931, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4535427413, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1911861016, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4147709342, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.446935809, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5872096767, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2876764482, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4733049683, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3405965889, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5263364809, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.311453647, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5087911718, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.311453647, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5087911718, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2636532817, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4632598951, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0042367004, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.371127162, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5606811328, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2883603714, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5083094175, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3465544219, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6023567722, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2740037448, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4683631908, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2740037448, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4683631908, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2581097804, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5114862976, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4026876779, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6359049001, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2814359739, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4683320377, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0899445598, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2887022044, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3766776486, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5833210829, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4644367532, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6512173868, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4244950971, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6318443096, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4244950971, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6505130875, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.092266595, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2895289299, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2861220886, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2095556127, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4512525409, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3626791619, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5398369635, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2453787991, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4099668999, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1426882823, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.34960972, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1936004931, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3215575124, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5282954234, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2976273272, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4476081667, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2354598833, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4060170573, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5051170492, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.656611446, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3509316371, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5161806517, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4187059279, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.580661197, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4228659617, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5934357259, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4207195865, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5867954121, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2817623234, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4634277516, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2769409829, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.365609916, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5370723655, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2641697524, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4438864953, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.309153605, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5049638084, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2377283063, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4229894191, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2595156374, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4469237424, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2864402731, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4643839365, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3169600089, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4926956772, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1905285417, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4177320592, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.5476697345, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6920019083, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3907048161, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5379358214, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3989298045, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5839375286, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2311953341, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4549622022, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4718701115, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6345707124, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2692424567, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4576088114, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1501956902, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3435352939, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3069270531, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.55312313, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3718474297, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5563193852, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4161334417, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5740077532, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2301547971, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4043490476, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1762902337, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3473939682, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3116287423, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4893092448, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.376147454, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5536622992, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2459980186, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4748582129, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4196211376, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.591599569, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3785127548, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.554861331, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4098335196, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5980339789, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4084096041, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5662632888, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4077296769, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.568189108, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3627861054, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5248963545, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0472010372, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1223770608, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.409392845, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5645111896, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3844723738, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5612506237, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4942847817, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.636086265, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3038421084, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5173698637, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3038421084, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5173698637, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3367704985, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5762640587, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4134997467, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5981100031, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1908020684, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4451297657, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.6611893921, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7385527847, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.5472843614, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6462543668, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4893668826, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6232884959, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4986401345, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6473028954, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4705190879, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.634829448, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0006449948, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.1568844546, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4711705838, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6028678287, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1666076672, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.438216367, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3109058809, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.504595183, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3121364739, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5563959499, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3121364739, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5563959499, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3657618229, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5569403582, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.29873904, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4908060991, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1212110381, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3665474933, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4872311075, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6623535405, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2757545333, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4738441342, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2898386903, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4975732771, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2806074146, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4965803382, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3681900465, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5504673899, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2210737907, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.447204473, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0738302696, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.1858211343, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3281444235, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5149345446, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.152372602, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4249945948, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2556346494, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.453803544, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2209414114, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4436055021, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2209414114, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4436055021, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1428350952, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3908013304, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2671559407, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4577424763, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.00210615, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4363671958, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5525891005, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2512606392, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4210700547, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3284145916, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4777770768, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3256597499, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5028101514, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2993726299, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4773135617, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2507373946, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4528590428, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2918722287, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2064920765, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4555957355, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2472606042, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.453644727, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2392120773, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4404453435, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2747717524, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4670076076, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2103835107, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4170983383, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3070946891, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5150001445, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2393813525, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4238287532, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1843911501, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3881716916, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.4484493594, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.639206193, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2927756781, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4753479834, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3407761683, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5278331664, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3126004767, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4866732007, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3024740133, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4860481291, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2147259749, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4190785642, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0562417267, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3317185958, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2624355455, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4888790165, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3240726885, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5123210866, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4048719917, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5637204316, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1986435881, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4520034758, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2851573608, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5144923376, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.299705727, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5028660358, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3501644461, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.531896936, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2549773133, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5321857016, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.5138735428, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6711767933, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4891724826, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6007992381, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4507468191, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5985843659, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3442651325, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5347748385, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3777925414, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5639615032, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3411216349, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5245337071, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.1349610442, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3651626112, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5425947357, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4651124441, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6535569144, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.510862881, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6929396211, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4133668887, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5851805477, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3894258203, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5648719586, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4485994475, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6258984728, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5438057026, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7108467686, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2723054456, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5114823809, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5629805731, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7184729617, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5392691323, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6950593237, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5248291448, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6920934053, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4257428978, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6292455373, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.509815557, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.68428018, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4102481417, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6198489534, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0072148746, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0949615226, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4803498024, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5963395991, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.31723554, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5055205673, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3335262555, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5258955094, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3516912179, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5464920089, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3475771626, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.545629099, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3038421084, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4957316235, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3404669195, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5294979443, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2085744631, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4646612267, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.4213151124, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6348713285, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3215895303, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4917944769, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3007845438, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4720170374, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3506937082, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5735580982, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3559980252, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5455195296, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3056769536, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4994609495, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0014196479, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2757973688, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4456052022, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4706737586, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6417233649, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3774268865, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5674314406, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3023325548, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5203155279, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3577099834, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.581833855, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3625286446, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6148737882, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4012050186, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6249577019, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3705035472, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5886100035, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.482783224, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6550149284, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4974561894, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6671359503, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4519603667, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6009987667, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.5542271267, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.72750495, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4878448947, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6426554194, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4345206442, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6585506299, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.327910617, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5832612672, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.5350666712, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6501051147, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3549111275, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5468570449, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.339818403, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5156759219, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3521993876, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5393886265, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3045124488, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5270886236, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3215522029, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.550240158, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4173085585, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.560162879, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1751902215, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3999732123, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.5730497087, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7127638644, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3981933678, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5407088038, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4647350187, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.614169318, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3862117493, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5629586598, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4173085585, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5727286658, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4031413392, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5857356073, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4316336298, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5611890334, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1096281284, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3474392468, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1284309656, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.335620143, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0996328903, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3282252227, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1304767108, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3118749154, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1422293961, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3221271934, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2530426809, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4243735005, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2323169802, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3975460179, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3134776318, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5290306159, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2142422006, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4196702091, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.248093239, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.455254011, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2279842488, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4315883078, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1980038259, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3944477326, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1854257525, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3788879538, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.0013506213, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2275054759, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4160796302, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4403035619, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6631416039, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3536676112, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5252283198, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1902934259, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4662657055, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1902934259, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4672523665, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3086036522, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5323991481, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.41255467, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.638679614, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2777982916, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5451746888, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.5747867449, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.7236969475, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.5046818725, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6768618696, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4698824517, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6509974369, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4659438114, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6469293483, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4778572891, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6889224434, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3442383359, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5764289441, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.001973165, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3962672641, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5928013372, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2481045173, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.52965422, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2348553454, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4891959124, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1893933851, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4905145936, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0706604664, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3470742307, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1658317981, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4396479746, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.189435696, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4523250861, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0051795097, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.076918404, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.5030879353, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6846791298, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.5055953276, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6788641233, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4207214329, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6265956117, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.5079711118, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6900890596, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4445682435, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6567673472, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1258024774, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3953613202, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.074467124, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3048524449, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3394216004, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5399361239, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3308295584, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5333110334, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3461114139, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5537111973, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2753998086, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5086546717, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2973669286, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5307507955, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3898683667, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6181891241, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3666868346, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5683418006, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1725434803, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.467904818, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.5181493033, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6641637237, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3559980252, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5099636935, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3785839874, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5535757116, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3201978308, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5281184079, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4147007156, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.613697628, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0202435982, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2294938553, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.162784213, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3513085831, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3057644277, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5175418594, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2401307751, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4569168961, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3734491517, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.549949382, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.111974253, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3419289955, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0858631944, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.281861395, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1841622666, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.029350455, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1848735107, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1650689516, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.4478336962, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6267235014, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3138538786, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.483003452, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0300411733, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1646127574, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2871073612, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4701937311, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3249785838, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5176680075, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1527358476, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3713082375, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0257414882, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.21119557, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4288316797, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3558905195, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5570369132, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3612717557, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5558371668, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1619935149, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4271616542, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1599294818, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4237133893, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1250807402, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3908878142, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2501291156, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4242027531, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1072727956, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3337433563, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.5488130347, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7204197306, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4269590215, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6090516839, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3699375619, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5932397043, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4346391355, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6487837276, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3994868082, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6159441456, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0013854253, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2464781979, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4673628408, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3504567097, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5647968278, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4463892737, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1581575107, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5152611872, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1446176982, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4699313689, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1446176982, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4699313689, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4031456247, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1586596244, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5308758517, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0851670089, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4091252891, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1583163322, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5032511267, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4370196291, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2066908627, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5076721272, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.156116341, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.50758145, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1155284124, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4154571914, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1467915344, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4372326744, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4122750003, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1541271916, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.50103537, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0553426563, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3968894621, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1236989269, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.445496109, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1487636071, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4833470008, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1481697285, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4827506957, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0665621394, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3843574133, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0919956587, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4320605493, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4272326098, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4295413952, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3532931582, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1753966146, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4973649961, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1609675245, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5069863833, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3986185684, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1080286655, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4137246392, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4041678259, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1290514243, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4766581477, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0955354346, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3531525294, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1242278855, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4022221056, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1202004095, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4201142663, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1202004095, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4201142663, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2878905746, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1145335578, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3913231806, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0585029035, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3116709576, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1568418932, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4148511041, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0862817214, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4027209787, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1046775735, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3674985321, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1302664976, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4155075504, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0710254993, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3628384769, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0777111818, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3481063078, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0397828617, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1175904695, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3996881234, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4042977714, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1371484559, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4549928159, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1518765555, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4991359435, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1518765555, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4991359435, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3878520966, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.078805405, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4311640428, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0817463397, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4119415264, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4312276313, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0759392175, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4598119013, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1284816893, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4421263684, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0919804518, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4598393647, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1319194103, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4054693593, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1024696341, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4016780647, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0779853025, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.40061137, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1454192396, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4757761293, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2223876386, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5765887803, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3026566819, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5945859352, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3939307348, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6204810134, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3939307348, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6204810134, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1881686819, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5179253054, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4095908744, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6348509381, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3433850255, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6024262112, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2352210164, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5302138314, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.104162457, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4646795039, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0962906061, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.43565499, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2841812334, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5398164027, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2366492606, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5547657703, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1872127694, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5089836024, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3765959323, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6295826606, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.408012692, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6210533026, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0603679684, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3758142676, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0779303106, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3700181222, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1020472825, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3281153674, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1072035288, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3865302186, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2718653389, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1378484798, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3805607814, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0683156401, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4551974335, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0986664427, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.428584562, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3327209336, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1777835118, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5166806074, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4056741942, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3500358866, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0093964737, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1358290639, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4334491322, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4018656753, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4164965411, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.429788858, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.429788858, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0774937091, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3853293582, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4303918965, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3627375495, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0802555532, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4011659418, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4341678483, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4362239051, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4250905063, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3674996461, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3917400674, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3634780079, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0625467808, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3887428578, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3404791678, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0876721013, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.40476518, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1667371654, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4569486349, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1357822319, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4091221497, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0542289899, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.335890202, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0648249124, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3859593134, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3916659692, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0846571427, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4124028027, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.074350531, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.434640867, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3461792119, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1018673097, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4366564212, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0655232271, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3576301367, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3731922615, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0824897462, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4045677777, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1049671408, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4262440114, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0910767522, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4297036776, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1473850006, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4659728395, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1693459006, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4846672446, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1693459006, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4846672446, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0643329478, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.396058599, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0688337576, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4079414323, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0622505385, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3357670083, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1262345212, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4305259422, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4502540675, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1724794141, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4832014438, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0975127082, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3956177584, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0722235072, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4018992451, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0553426563, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3757677532, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0630143244, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4249725533, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1824875393, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4759830743, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1063907795, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4445235155, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3370100423, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3805303131, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3984985733, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3538602132, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1174136855, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4489574295, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3599344656, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.090580172, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4576169175, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1049086753, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4381872831, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1676729299, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4691077977, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4743530867, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4066129165, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0767518875, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3985571535, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.083512119, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3303081245, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0752892768, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4225134174, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4351068028, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0908409176, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4286741659, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1110700642, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4423176834, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1110700642, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4423176834, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.398058944, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4277302624, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4186723698, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4357976698, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0764963637, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4589644893, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1264967289, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4132960986, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.121944907, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4776943039, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0930061672, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3802685084, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3692592583, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4606409591, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0799620979, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4279137012, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0797747599, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4136264759, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1676495735, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2291132016, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4913453087, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2291132016, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4913453087, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1139393936, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0008893632, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1102093996, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1240576859, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4089802134, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4077774236, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1701935253, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4455315746, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0893298382, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4122387286, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1035888572, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3618355572, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0726047699, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3350719307, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3569856992, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1275291134, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4127884602, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3867446669, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4331286519, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4168975502, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4173686439, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.262694995, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0720941576, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3406591924, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0583448239, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3034708946, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4345822107, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.382872078, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3795844422, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0701205311, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3123716746, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0723796361, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3405017839, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3681425965, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3856352748, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0876062629, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3978552284, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4423346653, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1137820494, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4981472095, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.090580172, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4729670967, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.090580172, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4729670967, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4098374119, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.429661484, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3614767738, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4537465621, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0740936355, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.496756597, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.113352035, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.465280802, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.108829547, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4177339268, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1075589699, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.402033296, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1056139345, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3623154874, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0087762186, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0902660698, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4602880143, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0605813979, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4408463415, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1059352062, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4291550754, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1531185236, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4119139452, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1531185236, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4119139452, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3916082207, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4665993964, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0584081734, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3534207449, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0884181804, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4777238617, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0678480312, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4265201702, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0917138923, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4735677694, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4750212573, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.120388539, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4736275152, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0787541827, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3869074207, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.003607065, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0957747946, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1116113366, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4277891734, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1170905824, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4050787124, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1572052717, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4788228539, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.091169769, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4065732714, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.091169769, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4065732714, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2973352935, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.008495716, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1018469621, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.229159308, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4771446399, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0792538876, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4921799712, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2756083223, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5392779492, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4234873239, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4034951021, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0678699362, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3421484177, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0830216973, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3447730756, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1278532052, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4661345992, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0861310683, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3975508888, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0982484178, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4109236039, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0888135621, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4336116693, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0769601895, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3952360824, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3201590349, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1469165825, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4160690364, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0392904488, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3378344273, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0758360142, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3751893803, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0764973188, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3813049789, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1448356871, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4535485865, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1044467505, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3816652428, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.059827932, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3623097221, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0562236516, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3446090827, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0211390008, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1166376461, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4124178868, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4225390231, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1649671153, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1558150733, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.156955031, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1118303682, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0008855827, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0008837045, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4534606453, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0702412758, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4729426711, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1654397657, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0754571307, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3506817414, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.157598024, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3556085508, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1113696975, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0765259308, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.360242963, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4263815701, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1250646012, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4614017513, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1176520159, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.474727527, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1190612733, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4639300246, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3866869165, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4729772499, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0009127419, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1387063186, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4884269892, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4238256552, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3248502808, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1289863678, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4211070413, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3934934793, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1124001584, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3755998557, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0935423784, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4409559218, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1274850671, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4508210684, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3807183677, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.101271711, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4525620765, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1405561261, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4124924918, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1385564427, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4023498311, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2172505601, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0740225327, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.391077727, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3225074205, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4536688337, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0768612766, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3776399756, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1282663066, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3656192284, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1199341863, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4771538581, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3703390568, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.06018687, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3434593498, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.0492666991, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1004106469, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4419310176, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1405908234, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4599803739, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.141632992, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3958314878, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2081516664, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4554402553, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2081516664, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4554402553, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2854365803, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1257518553, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4474760312, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0500780021, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3609874594, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1290651092, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4316039224, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1037125612, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4718081522, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3339687894, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1240861632, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3876257745, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0967684049, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.417806465, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3185508911, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.1366145931, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0710569903, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4048096993, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.117575195, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4440750545, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1200100437, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4636227306, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2018735692, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4845029277, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1706151562, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4576821113, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.381059511, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0894115487, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3829533852, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.1950507243, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.139423171, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4593597039, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1266453889, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4661468775, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1785750236, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4334421204, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1650868026, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4714504121, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1573543229, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4721332408, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0484986022, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3379527544, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0786211268, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4059503829, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1440031282, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4325604623, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0402860747, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3532348375, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0628957079, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.381388117, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0992035455, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3977340411, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1002646969, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4029197069, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0536448069, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.367820316, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1029351763, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4165632659, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0548436671, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3482099923, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1005114738, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4554345525, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3553498646, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.090421471, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4505535136, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.156702536, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.46637404, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1031315156, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4069435434, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0701281752, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3697200812, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0826957641, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3818515619, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0501425278, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3803262907, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3489532011, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.190456797, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4124342445, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1318651586, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4331981792, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1302091241, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4303732604, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0745423297, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3206098286, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1068536272, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3771843601, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1023687249, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3655843516, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4300304627, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3423817261, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2412099573, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1596949542, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4493675427, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1188257647, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4137309804, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3052529257, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2122968331, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1050049247, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3530645226, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0698088434, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4119294666, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0527592302, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3724723204, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0921222182, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4009305713, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0921222182, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4009305713, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0518279709, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3356084649, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0639497921, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3855824296, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3850936816, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0723799, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3785450894, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3862862498, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0896413162, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3962711439, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0842991092, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3783947297, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0892930307, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.38125907, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3702634246, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.0211881162, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.059737096, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3374204881, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0798094979, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4142041527, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1265080981, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4579202272, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1579087295, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4587242582, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1579087295, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4587242582, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2703148103, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0008494733, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0681137628, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3973370121, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4580958607, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0764396383, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4790280948, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1348878986, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.451978804, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.112483373, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4740845297, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.112483373, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4740845297, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3695518314, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0373566711, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1590755116, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4524235916, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2415826889, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5410427858, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1913552328, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4994780514, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2128223811, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5048999729, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2128223811, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5048999729, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2068937728, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4991818748, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2128223811, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5048999729, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.204006346, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4911943731, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2192257679, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.493906997, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1998967244, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4954677323, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4522625001, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2316796382, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5128772172, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1545508748, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4692608507, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.211191438, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5030156541, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2128223811, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5048999729, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1146920231, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4773635651, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3798211577, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1058861281, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4068718482, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1034927523, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3964622986, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1007827284, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4064722661, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0541154953, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.326151405, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3816046242, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0976968, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.348984186, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.120444339, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4241018127, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3326031647, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.069862804, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3551358761, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1151138596, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4390413777, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0554945103, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3537313942, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0463757348, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3494774272, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.248025635, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1501723789, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4481403581, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1685272693, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4770045428, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0967458811, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4485783192, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1425945748, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4433395106, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1292980198, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.448116395, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0508964906, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3323165831, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1215444015, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4781074822, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0745452451, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4226523751, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4509406663, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1214060468, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4867949101, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4257191895, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4447505575, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0679075089, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3646185253, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0658060541, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3925312277, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3413034268, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0930906032, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4298405489, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1022689845, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3160216877, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1330873945, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3932447623, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1594511174, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3874937023, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1622298454, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3853884541, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0459035054, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.359090795, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0655311225, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3473660157, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2874604387, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0809078049, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3980111654, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1363414938, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4566019632, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1053994975, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4337252582, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0831307815, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3775192885, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1170522839, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3876750317, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0694594154, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3753282438, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.0017825312, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0608256269, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3677720077, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4003081125, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3645369665, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0719729482, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.324495728, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0888682354, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3395357801, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2954316288, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1350858706, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.206251433, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1074470458, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4113914052, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0615992235, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3907129962, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0812127106, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3834712472, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3461341635, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3120575186, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.127039314, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.36503714, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2512259104, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1421446895, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4331731102, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3798877864, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1545374648, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4413516563, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0574372412, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3567809954, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0547402856, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3326088943, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.212628609, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1457144765, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0995997993, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1158467153, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4340544251, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1082417479, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4249858141, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1336446465, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4204857168, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1064294454, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4272539644, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.099942084, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4116031652, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3077903381, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.116652364, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4070049033, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1071314857, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.415221117, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0911770522, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4370648066, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0911770522, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4370648066, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.1585163492, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3944339442, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2901032948, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4162826479, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4023801362, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1176594164, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4498450226, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3814511365, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3783361329, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3173115828, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2862195368, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0882441366, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3977541835, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3292309575, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3702987017, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1557626829, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1555926073, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1722828487, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0008931761, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0931875173, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0710572276, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3833002336, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0669996531, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.395356259, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2594621784, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3775667654, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2677919775, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2821488742, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1925881801, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3162255424, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3167335562, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3071885377, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0870411568, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3065421855, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1218935493, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.346453894, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1614090408, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1103895088, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0892362305, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1623104335, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4771296527, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3947523667, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0909220667, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4200146131, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3701108639, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0653470542, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3665033088, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1050547201, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1082325532, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1084979261, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4432352691, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7203175886, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.388706742, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6484380085, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2390492201, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4803366377, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2390492201, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4803366377, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2471587379, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4905179281, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2416561876, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4975964814, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2390492201, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3399292774, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2450810477, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5725552336, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3360821338, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6155314069, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5091686102, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7212096272, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0592258122, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3415915216, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2080125861, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2670350854, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3531504096, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6258951885, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0672488842, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3966748061, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1113399676, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4410280354, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1193019148, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.381276479, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1193019148, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.381276479, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1134644651, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3675317023, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1138130544, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3712977178, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0988017723, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.329763835, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2377604053, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5690390534, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2257340881, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5444672928, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1074271647, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4269485915, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1907336359, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4989538294, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2382348118, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5209651953, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0437839432, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3208878745, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1474587003, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4751706379, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2868985879, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.591501744, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2645953895, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5272178908, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2133951876, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4808734552, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2133951876, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4808734552, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0122014538, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0630508172, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1314431278, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3988554849, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1754678706, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2631827194, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2434257081, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5341782261, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2941675978, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5906648119, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2584847655, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5525933857, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2407129896, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5438509852, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3018146853, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.574226629, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1524391968, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4040108218, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2063890417, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3856767885, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3295566055, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5816133442, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3428955164, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6023036718, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3563758622, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6037023613, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2347648664, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4773200603, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2407129896, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4824631769, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2632018059, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5013027198, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2119023555, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4239461618, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.202600477, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.264236181, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4538010737, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6446834621, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4537725564, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6400294743, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2058673668, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5693016623, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1455399827, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4504825147, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4537725564, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6472259254, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3224480216, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5927918264, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1758665551, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2758687847, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2948978499, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5529453974, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2903774731, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5917006931, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2158914622, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5448184156, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1435400751, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4107294811, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.143828549, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4429424015, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3915235765, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3628970589, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.263803328, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4054234087, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6673047516, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0197185083, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0817534097, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4308342322, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3268233488, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6084114124, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.399705432, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6701057244, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0578550959, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3713083116, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0475993764, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2500653935, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5855288679, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1204950506, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4930503943, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1803130734, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5221644548, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0107906037, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0893376097, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0832124641, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4202131285, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0378749842, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1308309461, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0781107061, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3658749228, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0104834969, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0555654153, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3086504522, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.615174809, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2846319621, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6104886551, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2006411049, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.520576163, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1573857459, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5347526445, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1766483676, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5371605646, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0601807787, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2928392755, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0081800691, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0460587753, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1390432069, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4716936508, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.367816899, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6454684778, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2999092588, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5505916495, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2434410061, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4904649875, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2434410061, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4904649875, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2772655015, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4799723286, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0569456532, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.1070378443, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.187397552, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3146671919, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4472334739, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6623509161, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2516768028, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4957220977, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3471036105, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5663019495, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4046850803, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6187842062, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3122980432, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.547253828, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0090709643, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0685240447, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3212066202, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5836558214, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4980453293, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4263684749, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4128899494, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3835625858, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.422857407, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3626737185, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0567604154, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2982745415, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3946429129, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6481030286, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1885699317, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.574221547, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1112650985, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4338923577, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1723649106, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5548663879, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2383229028, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5742431739, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3797999858, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3540506409, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0890609288, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4317746285, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3078367779, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6417108947, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2562849004, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5767019342, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1708279669, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4638787181, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1985174302, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4979362156, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1174973452, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.380078153, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1692546646, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3242354182, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4446493539, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6962239473, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3936136052, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6453682761, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.109547829, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5090382887, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.283448433, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5201572705, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3348517042, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.586470904, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.251095495, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5187154029, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0065693329, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0608641961, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2756885721, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.586707787, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2162882016, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5347607538, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.24658885, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5221084446, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.193759007, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4417223478, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.193759007, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4417223478, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1324062816, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3347576435, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.149905493, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3679304886, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1595501169, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3036044023, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.370818391, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6563960893, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4367441765, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6420436201, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3137233353, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5741396495, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4583603883, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6713553243, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.457706572, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6651583454, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0907454262, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3474348332, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1007706206, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0976048286, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2600884211, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.531430107, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2537710754, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5898314099, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2215037081, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5463488388, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1822031057, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4903627893, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1822031057, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4903627893, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1457440266, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.427554376, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1491797471, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3881363329, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.134697415, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2344127632, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3319944964, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6676204565, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3410035629, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6673519559, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2475002812, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5894646099, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2687379663, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5826619908, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3319736336, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6622924174, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1549337617, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4612953862, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1589733361, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4496168003, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1508931842, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4042478943, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.316646483, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5144731748, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3946181132, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.565520411, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2460808119, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4231213699, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2452766493, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4209094498, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2196725747, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.374139067, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2377205844, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4142852642, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1822721151, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3382801866, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4624783675, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6143805843, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3116520879, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.475177924, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3627923368, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5255399247, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3425544778, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5070430597, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2209272285, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3959441218, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1287037621, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2215145117, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3018146853, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.526180278, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3842999367, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5816504483, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2556417714, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4987001162, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2582739151, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4946279038, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2582739151, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4946279038, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2794641523, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4938296655, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2377099561, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4452519937, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2883396105, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4595830151, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5465908824, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7387035187, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4260570739, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6273945682, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2692560123, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6050395148, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4323587716, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6144858674, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.514056486, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6829131725, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3017931626, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5734438795, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0129511125, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1188227704, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3272963527, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5715613564, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2258043389, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5281957185, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1598584071, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4495105333, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1549337617, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4181663628, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1549337617, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4181663628, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.179205314, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4522763056, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0915032166, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3782062666, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1604629854, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3770931135, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2619940054, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.580482787, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2053325029, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4968181034, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.284672153, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5192330976, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1672112091, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5078446329, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0950330052, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.253555451, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2037817226, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4860000824, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2573392925, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5328565784, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2721758985, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5756343667, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1219255025, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.354893184, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1219255025, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.354893184, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.158138598, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4460734029, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1277236961, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3877116206, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0098323728, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.069950039, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0054545014, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.025252054, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2053325029, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4597563508, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3077422017, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.594367382, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3077422017, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.594367382, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1008184365, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3816541008, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0956457151, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.190700911, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1035315356, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4021541036, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3020162744, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5582696703, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.284672153, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.429805282, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2114773474, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3936506204, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2114773474, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3936506204, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1935893403, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3468163065, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1836680713, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3534547964, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1286057341, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2808359248, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3800528767, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6363479287, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3295957765, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6259287395, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2432845012, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4275623226, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.383259261, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5920204218, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.383259261, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5850640222, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1059945314, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3342872229, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1918099259, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3308002143, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2230570607, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5202782712, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3067966119, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5967827152, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1542676523, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4528962596, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1625157206, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4012344465, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2290847694, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0047701958, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0374656656, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.158055386, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.411594036, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2067556332, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3349039842, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.622575201, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3057322896, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.582179666, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2324010239, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5335795368, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3148724833, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5905881236, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3599498756, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6548318752, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1580450005, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4016522361, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0350999224, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3020447394, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.539463539, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.7409995287, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.9017022389, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.7096224668, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.8862932371, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.882190725, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.9431233924, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3979309387, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6648788692, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.7147882714, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.8408773556, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3359230828, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.57308612, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.7106361352, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.8390104108, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.777055454, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.9260678177, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.8767740197, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.9055624233, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.8627586294, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.8964369717, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.9082489096, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.9677853955, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.406750508, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.629072095, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3371375731, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5731908179, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2493112668, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4453900014, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2013498447, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4759326319, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0114390994, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0710901115, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2078672147, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2617811878, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4840047963, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7068360974, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1823619818, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4546828651, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4710304492, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6951644806, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.5068325976, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7027078356, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2479382788, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4560817653, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2078672147, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2277258179, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3646359725, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5937597266, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2571503337, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4370732967, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1912914302, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3904734455, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1147085652, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3110379721, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1147085652, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3110379721, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1273150539, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3354785768, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.116574788, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2959661547, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2055434718, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4145758428, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2541277778, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4083801145, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2481451415, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5127275551, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2941675978, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5720229383, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1361285171, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2916549695, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0440854328, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.0536282471, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2500984052, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5100793539, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3785695085, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6309392506, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2705794901, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5644281635, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1436158053, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3817908835, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1436158053, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3817908835, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1676495122, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3695910508, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.229713206, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4379547539, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1839576032, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2651734406, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3741624128, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6754691164, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3556383209, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6120361599, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1930040362, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5728224508, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2799103318, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6172633503, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3888403695, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6733543866, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0322335194, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2249430587, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1549240256, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3125746694, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2323385181, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5357993047, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2181538317, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4682927597, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2428517224, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4655392376, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2452766493, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.484628782, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2452766493, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.484628782, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.008072417, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0638829524, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0136162147, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0583054295, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0106593966, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0619556376, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5091686102, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.73205138, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3297870802, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5720518025, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1985174302, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5474682474, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3415343338, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5541872808, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4024358403, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6233256625, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1522227534, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4114953475, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1203104149, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2540681993, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2191094271, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4572726847, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1221178128, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4347129561, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0727637531, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3886183939, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1465186014, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3998401696, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1221787241, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3801321934, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1112538229, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3636258924, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.057866883, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3224621534, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.119120742, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.282571716, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2475950284, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5238368455, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.257978243, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5649286214, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1628565646, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4184572059, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1752818941, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4632619281, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2265973317, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5133896303, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0719816959, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3447650859, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.0615089586, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2048432252, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.499668842, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2378267889, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5516686848, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3520553563, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5769772651, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2031034196, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4246920221, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2191094271, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.417561662, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1960463553, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4335041535, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1927168037, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4181794106, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.199852716, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.319624988, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.4296297517, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6526674281, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.4116779987, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6679764037, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1905758291, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4425716792, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2799506948, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5700777643, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2799506948, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.571487805, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1958641343, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4237067935, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2904194746, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5399262338, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2363347557, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5588648359, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2110833281, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5847750744, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1490671938, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4338972266, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1490671938, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4338972266, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1543252261, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3797469087, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1649662542, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4276666256, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1409879075, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3116234879, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2721758985, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5875203797, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1661717974, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.481170266, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2358449401, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5389135952, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3317416308, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6310870942, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1606777497, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5196854931, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0119615938, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.1017181293, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2727180443, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6231583015, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3082995366, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5552978545, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3520774812, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5735788202, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2466475164, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4926614281, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2471587379, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4876485133, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2336554865, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3869598157, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2337426077, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4481831081, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2064415644, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.275694494, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3563758622, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6152190693, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3602927399, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6148633329, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2024192471, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4785445547, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.329174567, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5666889548, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3561691349, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5927193326, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2698654984, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.44143781, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.202600477, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3027081888, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.273537982, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4703704191, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2369634784, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5659243375, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1506914982, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4940985004, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1373110293, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4144705269, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1373110293, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4144705269, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0999329828, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4818038599, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1184659269, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3317492265, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0971651629, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2740071858, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0163812579, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0197185083, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1176029704, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5037771892, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.311786811, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6235184561, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3902940037, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6594442432, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1028840244, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3793737662, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0054987474, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1850249528, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4977490366, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2772655015, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5163486941, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.279729003, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5092945861, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1793807477, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3700416466, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1838080698, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3773267167, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0431674226, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1451363418, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1511810638, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3824079628, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1623128779, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0054545014, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.025252054, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2442096106, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5294098428, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2078738911, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5395612843, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1910791231, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4745702643, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.248223953, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5350941461, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0610440884, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2770877905, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1822721151, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2673992651, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2244921782, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4854786915, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3432429128, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6000833981, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2603680277, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.525575209, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1545474372, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4385517124, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1261143541, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4168654071, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1771478795, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4959629507, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1597949311, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3970575034, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1180533497, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2935516229, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4427450628, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5831413075, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4980380502, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7169270445, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2479382788, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5551406879, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.5143871786, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7463887744, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3817026511, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6579835999, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0937548553, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3899074238, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1568616677, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3333409033, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2256379391, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.486328318, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2425369392, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4604841587, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2403409204, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4624667457, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0645228831, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.1340641152, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0645228831, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.1340641152, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2181538317, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3744477364, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.127299923, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3412348387, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2339053692, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3436066938, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3336658628, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5974517288, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3239689745, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5878660876, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2299157921, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4195683528, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3529455533, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5455305267, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3573039794, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5470354051, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0977726245, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3252901824, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2119156724, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3783561288, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2315035513, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4851716246, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3217968952, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5555275088, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3559247479, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5565115126, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1855346841, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3940963549, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.190490911, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4006079291, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2062051323, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.411920981, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1837965191, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3612486867, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0166801725, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.0493773158, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3856586473, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.660713981, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.250554711, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4803657005, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3729459505, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5981276629, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.354514448, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.596597145, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1514682562, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3378568688, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0034593773, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1058791034, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3295957765, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5207914581, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3268233488, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.534280578, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.270750755, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5201549, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2306483513, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4550457003, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2309503728, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3955361403, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1154677212, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2604812246, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.098150962, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0857185441, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1334566096, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2553729385, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.417598414, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6502955434, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2670989083, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5611797797, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3658141332, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6386889737, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3748533898, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6415822794, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.170010781, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4015793527, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0796466221, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0820938247, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2475950284, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5330580248, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2735686394, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5735412935, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2666372228, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.583913267, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1676495122, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4477014617, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1789375751, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4768883481, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1649662542, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.447328943, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.190490911, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4428914783, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1983497625, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4190981087, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2081220992, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4762583476, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3014043687, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6234338872, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3800258815, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6549174593, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2600485005, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5795275013, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1358234428, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2323305009, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2704580389, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5815404493, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3057322896, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5337455378, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2667836062, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4889374374, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1286956742, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2959351859, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1287037621, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2961496633, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1248655762, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2904789102, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1059786102, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2561557977, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.109083703, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2464850028, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3664435775, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6024962574, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2934447092, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6498290192, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1355166881, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4424571214, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.269748293, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6331597127, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3304755731, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6190675011, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0532700379, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.230366361, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.103698167, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.252769107, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1193019148, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2629540344, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3845928642, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6331548374, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2391987762, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5302876334, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1992314068, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3879456292, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2071184025, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4418611389, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1465911128, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.307998819, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1793559985, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3590687067, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1069893156, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.213618885, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.370423466, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.650430348, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2452766493, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5385267265, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2736255492, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5566377411, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2940297877, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5428150223, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.288476769, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4969423609, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1509387355, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2693941895, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0620372606, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0682407232, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2119156724, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.488968745, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3693450793, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4718547624, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.382496263, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4097623419, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1477219991, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3092919093, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3387562718, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.447855974, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3693450793, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5103516765, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4155813233, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4704204244, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2423441824, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4429509374, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4646232199, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5678926447, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.6064630666, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6752055522, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5357110024, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6365941773, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.696091741, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.8209757785, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.8468261925, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1537137193, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.33229372, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1479026426, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2715976759, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4751132439, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6849386986, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1385781431, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2613639178, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0863580005, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2181093713, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1979417957, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1979417957, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1398001346, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2510112236, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3479159475, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3638143922, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2023307409, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3746629493, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1767874865, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3180770066, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3728487543, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4488840104, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0925329499, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2110486161, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2887308473, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4165448483, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2971085373, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4168101139, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1907589726, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1245338934, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1415437573, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2594145364, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4272870064, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5425603129, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5642761728, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6181373707, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6458552885, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7468283944, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6458552885, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7468283944, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4440750606, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5402588602, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5354063184, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5965096072, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4412006373, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5905813393, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6834390596, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8247196817, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6458552885, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7468283944, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4331017717, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5345334109, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4440750606, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5402588602, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5411953361, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6208023495, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2648197927, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3212854968, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4717132762, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2704657013, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3736509639, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2615858283, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3544753095, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1787854024, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3656823493, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1787854024, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3656823493, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2553063553, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4224404198, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3467495877, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4348853299, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2964215119, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4213813461, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3014785663, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4883780556, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.5805399561, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6599074621, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4439209066, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5678926447, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4089156878, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4652232922, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.8468261925, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1479337875, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2894223556, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1143643336, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2322197174, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1858098589, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3347249292, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1288769653, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3011436843, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.151385146, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3237497764, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1801210738, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.303186027, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.186930008, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2921403403, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1544458228, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3343587267, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.291600602, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6110386192, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1708005297, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4129513432, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4331017717, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6107152354, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.163697731, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3525432121, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2381726144, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4482866117, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2067984532, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4763649461, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1960463553, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4861187555, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1438055362, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2597661792, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0914782711, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.325876252, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1496597508, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2221350278, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1560424227, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2255928425, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1406853565, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2236993941, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1464393786, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2280856445, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1496597508, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2221350278, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1496597508, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2221350278, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.240996462, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4084256741, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4989742135, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1818060822, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2765353482, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3160946016, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.407876439, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1746624011, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2719194508, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1598051812, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2292736049, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1231636546, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2615858283, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3586291842, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2169036581, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3306582665, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2472851569, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3088155734, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2133316442, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3391141279, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1139185695, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.2717713022, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.2771846161, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4578226095, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5187171262, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1989591392, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3871693346, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.6052987577, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6657086816, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.536592063, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.627403903, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4578226095, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5406296, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.6676191941, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.813871099, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.1802926862, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0020542317, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1228699602, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3156766874, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.368528912, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4706235856, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3532035105, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4910213297, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.204212837, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3132427424, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2001670148, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3176647236, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1582036217, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2249046365, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3693450793, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4918148373, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4618138251, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5392962546, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4185938788, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6016367462, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4192761856, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6279656551, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4753167452, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6372909532, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3831792393, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4797562498, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5426924329, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5783770796, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1634124231, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3008646672, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2054194471, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2567840481, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3704514903, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2066418182, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3713596877, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2366036239, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3415269784, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1477219991, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3092919093, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1477219991, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3092919093, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3693450793, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5103516765, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.458703244, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5232464635, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2360372104, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4074433071, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.6052987577, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6657086816, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5357110024, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6365941773, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3676308285, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4563714051, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.696091741, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.8209757785, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2651756542, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.1693597635, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3126851492, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4199072509, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4388504279, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8080705633, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4841156774, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8256726071, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.8363600587, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9912737183, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.8895260356, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9215559913, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.6018154976, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7669980679, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2248107417, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3761108267, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3458989585, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4479204267, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1439778619, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3331521962, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1458752125, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3305597684, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0819753973, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2552663483, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3301877574, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5054531555, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1514631652, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4192400624, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3032929625, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5077415448, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4399465474, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5758276579, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3730786951, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4740166009, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.382235936, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5729676576, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.382235936, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5686739422, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2171185208, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3407697847, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.1932896646, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2047715641, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.337172818, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0079346775, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1998460736, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2932603148, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2674274418, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.290662742, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0893927012, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2952752522, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1307118752, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2556075727, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1954598433, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3260504123, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1772984226, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3337514619, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1634124231, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3022768387, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1709586441, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.280574965, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1395211838, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2962794525, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1307118752, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2771420975, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1907005288, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0287356322, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1767008775, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3136010782, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1350236732, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2998597453, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2727419107, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3743643897, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1333497993, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2559597723, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1333497993, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2559597723, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5265891376, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5667866238, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1798194942, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3488441223, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1785703341, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3263243536, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5805399561, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6599074621, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.6244631487, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7155411017, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.696091741, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.8209757785, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4307079424, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5011615373, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1966586469, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3691337711, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0195165738, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2241905682, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.357730604, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3166144686, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4171828599, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2434330428, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3185890038, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2543031675, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4159778448, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2538149474, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4177779283, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1508482523, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.328488685, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1508920852, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3228112224, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2885535727, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4423533755, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3160946016, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4791760084, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4452652852, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5889782978, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2677353447, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3932141709, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2732665373, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4001542443, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2335943386, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3616178262, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1536690667, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2337346283, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1680010297, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3319781988, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.248781805, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2400752825, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3108446705, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1241665906, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2314102878, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1241665906, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2314102878, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1276902706, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2184436083, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2685378335, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4156633794, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.1659971111, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4246183605, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5497460512, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2252369759, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3911595396, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2370526644, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3838188339, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1852972751, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.366604121, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1634124231, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3389374743, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2469646873, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2653698485, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3730786951, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.408087192, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3674668905, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4097562809, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3615855225, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4104273002, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3615855225, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4104273002, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3931807596, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4158735804, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4154606003, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4643168082, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2212877653, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3299817815, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4516759457, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6430302721, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4578226095, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5429809487, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1767958813, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4098986064, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3675058902, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4451716384, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3811228251, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.458075344, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2556795749, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3431135837, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3196352513, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.291070873, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3951783328, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4092112922, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.462803416, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3763743474, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4120099199, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3615855225, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3998925449, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3615855225, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3998925449, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3479159475, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4086436809, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4093301993, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4471788729, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2127127537, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2964311555, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4526762557, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6356631092, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4516759457, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5192073148, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4056782022, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5237454578, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4092112922, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4428945231, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4245970617, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4579580789, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2733459421, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3492664331, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1397818378, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2134385691, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2969932315, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2069099661, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3003619338, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2327080491, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.347858964, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1925775824, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3523071217, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1925775824, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3523071217, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1123490599, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1522525152, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2253492144, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3055805564, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1346180129, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.320287943, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3869431776, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4758624095, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1373389435, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2635601633, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.158781743, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3163237076, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.220957314, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3344327761, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2113573875, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0143792156, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1294364849, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2994283154, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1961887304, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3136840647, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.224530027, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3354597456, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1491744506, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2367201175, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1491744506, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2367201175, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1206145072, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2822786212, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2448987534, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2193664451, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3266422289, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3011172971, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3734627919, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2651812298, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5148468754, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2082376264, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3665582909, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3159148238, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5258141914, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0034435262, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0109170306, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2231669815, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2187746652, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1834152453, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1456734389, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1570303225, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3020103088, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3662566369, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3185739649, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4268500782, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2623469367, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4772894233, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.627230008, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2852650068, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4720929044, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2523841428, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1114672746, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2396902718, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1410002458, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3371303924, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1820475071, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1123102665, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1772984226, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3230516835, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1185666012, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2206684365, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1278953338, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2283763804, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1051184684, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2084977525, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1051184684, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2084977525, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1350236732, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2597905925, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1383436846, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2622351749, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.1733481974, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4349750776, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4492746395, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.168059369, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3269489742, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1627934873, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.314963929, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2820004916, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4068212169, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2820004916, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.380937583, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2006919097, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1240959712, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.1944925525, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2808924132, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3924166546, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3571150501, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4464287682, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3359540718, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.433506473, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3926492355, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4617232533, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2727419107, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3975634914, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2538149474, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3194196589, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3759019493, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4642775124, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4470252726, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5551045432, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2595185903, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3440658218, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1323229159, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3103406768, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2295748847, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3277581849, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2733459421, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4045014812, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1190200191, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2714975492, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1904070085, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3541764955, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1022875702, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2228850613, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0896823525, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2175311081, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0717463028, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1763343461, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0669590069, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1718001136, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1064085069, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1526683807, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1725958266, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.0991866184, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1060131743, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2251385458, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1633065747, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3368814282, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0981216326, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2390978511, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1040157761, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1618434772, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1060131743, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2305932306, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1085135458, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.15031519, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.006827911, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2164910349, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1029370477, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2508347331, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1472462377, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.305253102, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1068282725, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.18978046, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0994149095, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2289718867, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1959280139, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3670813175, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3634336506, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.432454548, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1532674182, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3141572038, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.5805399561, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6804343592, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1379662085, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3011443479, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3166144686, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3931514398, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3761648431, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5466736283, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2910873659, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4001749131, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1088426762, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2489918633, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2600792506, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2616747577, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3913455745, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3131422481, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3932583888, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2921936291, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4376778735, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2921936291, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4376778735, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3615855225, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4838257583, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4501609222, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5565610322, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4315505267, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4766479849, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4671778989, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.583541923, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4441171231, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5742558726, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4671778989, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5801543736, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4501609222, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5779114322, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4501609222, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5779114322, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2633684432, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4212549338, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.061704849, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2719977823, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4129085501, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2637873056, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3076866807, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2472851569, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3122169397, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.204212837, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3589029375, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.204212837, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3589029375, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1695455529, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.318008567, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2100485023, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2695278236, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2432822124, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3587841405, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.6052987577, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6657086816, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.6064630666, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6752055522, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4148989571, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5351666707, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2505523539, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3831975161, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2324422363, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3586451994, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0969436154, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2353989149, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0361680929, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1900414584, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3699750032, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.184327699, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1204542218, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2218401335, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.114343382, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2022592744, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1494197913, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2347938067, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2122363344, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3152057664, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3859348084, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3825784968, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1156308445, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2417806321, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3925121365, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4964717586, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1784687728, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2823226788, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1532685995, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2563896885, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2595753046, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1691896235, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3068908283, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.182230588, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3360020595, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4979723869, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3306242913, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.48871289, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2951516238, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4006514402, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.283078907, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4006557495, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1827974487, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4024804883, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4461240556, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.62456731, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1005094239, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4298810543, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.576564253, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.497644808, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6328520698, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3360020595, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4979723869, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2676032276, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4068945858, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3839162952, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5154389469, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3307203629, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4908642531, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2231944965, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2330781491, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4116769065, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1316478147, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1353668111, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2359597252, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0793908715, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1100663745, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0793908715, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1100663745, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1185666012, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2130317058, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1649415533, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0986549882, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4027788022, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5140425251, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2536955092, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4403746462, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2650521146, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3924854247, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1601125708, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2375277828, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.143779191, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2548981392, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1200550028, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0339089194, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1584358964, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3615855225, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4063549118, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3479159475, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4062384533, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3996921471, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4394299727, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3996921471, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4394299727, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4154606003, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4663335537, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4390960898, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5164819147, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4525447569, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6016367462, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4246183605, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5045638982, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4578226095, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5429809487, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4390960898, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5164819147, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4092112922, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3918928771, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2774870274, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3718928736, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1600733594, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2350173429, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2718226943, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3135936385, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3917196589, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3964644744, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3373755459, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.369875666, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1423412184, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3114279239, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1863161938, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3613802877, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3780488662, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3874953836, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3780488662, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3874953836, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3040122368, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3640142384, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4435790342, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4885452282, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4435790342, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4885452282, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4246183605, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5019489573, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3200158957, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4105050567, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3252211131, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3743770395, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1767445235, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3030436823, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2116370043, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2754475816, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2543770619, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2885872184, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3479159475, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3998134582, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3924259175, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4246539837, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2144862947, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3142841654, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2144862947, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3108688605, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3120848454, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3705328519, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3865695386, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.388047078, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2047715641, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3021617561, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2082633427, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4395502164, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4185938788, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4981521959, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1805915447, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3333808784, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2733459421, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3569072627, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4154606003, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4397124903, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2732665373, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3528072459, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3127760081, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3423771857, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2594432023, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3049825437, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1375090231, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3476437558, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2102754594, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4572185176, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0981216326, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2684447524, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0950026632, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2717648187, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1411399193, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3385181303, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1462806365, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3207408262, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2560038657, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.5204944454, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6659376403, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.504080218, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6292677087, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2538333923, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.462858458, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3071373083, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6108807661, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3175634859, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6126383724, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2279713172, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.104552581, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2276648082, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2140405179, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0863580005, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2387557372, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1141463319, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2503197875, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1615634589, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3073644007, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1615634589, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3073644007, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0741818249, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2636395833, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1145013792, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2307519533, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2482249519, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3198663637, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1508271374, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2362536212, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2467176349, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.318060818, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1022763759, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2461976716, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1109277014, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2475262677, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1078856901, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2485245843, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1770481008, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1179949262, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1080439968, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2560670416, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1726893279, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2845292485, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.181050485, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2710540879, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.149089608, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1969983002, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.149089608, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1969983002, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1099151473, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2549321593, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1813000495, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2015862471, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4477604756, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5575708229, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4125656014, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4889462808, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3471636178, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4191180487, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1749383057, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2669026163, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1998573974, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2618744307, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1311005272, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2567840481, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3517975293, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6417603075, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3770929789, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6881502501, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6364887817, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5285087045, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6520135111, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5344225462, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4954628898, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4057723082, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4519601247, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4160221122, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1884239372, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5622542444, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.429665206, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1884239372, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5646801081, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4134580028, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4971306033, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1619557013, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5816452677, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4638613135, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4173415078, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4292927111, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5848202846, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3331975426, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4085415213, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4043598708, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4043598708, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4164061299, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3494501402, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3758138913, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4056229085, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3327212134, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5709936729, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4056229085, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4056229085, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.466964361, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3354695537, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4031909986, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3128264071, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.396188029, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3099872952, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3099872952, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3933793008, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3955832344, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.389666294, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3032579702, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3066337968, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3892064099, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3010381622, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3118742681, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3933793008, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2878329791, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3958941272, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4418365362, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5948724603, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5644198745, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4566163202, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5049375876, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6087963427, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5565173534, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5582360999, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4915933924, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.44291963, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4854320704, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4146934197, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3945152128, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3431841259, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2744793826, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6152918483, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2948993987, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5989264159, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2948993987, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5989264159, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3157355812, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6989238098, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1296247288, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5750206459, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1429614563, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5102054231, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3311822752, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7010244057, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6245952145, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6245952145, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2680165156, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5989264159, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2680165156, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5989264159, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3259481889, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6263180162, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4425650919, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3259481889, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6263180162, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.263026805, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3376229723, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4279680256, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4179740301, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3933660075, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3995247811, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3811737094, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5189004396, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3209453837, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4101715668, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4583484187, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4498692001, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4568577004, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3175422719, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3974726419, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.195647515, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5832256254, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2658483577, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6410540991, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2357831604, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6511343055, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2357831604, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6511343055, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5639241777, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4616072653, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2533654946, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6437859092, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4513165758, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7514771577, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2357831604, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6511343055, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.528106198, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5554602681, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1718152967, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6053635787, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.652006546, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4129175011, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1718152967, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6053635787, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.50663118, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6562641137, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4494592021, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4539380324, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5013632657, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4400698947, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4574633933, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4911811018, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4911811018, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4224991955, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5379068753, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5379068753, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4449388482, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3348758882, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4601349894, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4354398636, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5705717737, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4044335714, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4044335714, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4121946181, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4044335714, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.421953022, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3990998963, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4166363621, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4242214542, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5606044054, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4276677754, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4070621794, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4044335714, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4121946181, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2197281387, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6022094443, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3113878808, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6728506998, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2130541362, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6284808905, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2130541362, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6284808905, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.312849684, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1487964117, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4213182963, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2189910846, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5773502692, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7999099314, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5323469509, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6371798394, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6423124418, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6423124418, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4703657604, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2970314819, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3292499963, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4402401015, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4550016613, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4440931656, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4483037848, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4746507483, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4483037848, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4936014901, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4466798503, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2623399284, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.437315621, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4050845737, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3981852532, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3981852532, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3844263765, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3844263765, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3981852532, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6474126202, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5802683404, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1881478575, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6285580962, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1881478575, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6285580962, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6131017059, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5513474668, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5513474668, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6474126202, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6474126202, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6131017059, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6131017059, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6131017059, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5802683404, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1423071533, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5673078469, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1992340566, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6211036406, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1402577516, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5380752589, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4637878319, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6919476196, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1769497515, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5437152782, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1457684615, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5633850959, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6120635843, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.5303624596, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7835371348, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3969996397, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.7487402157, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.9260013113, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3703046834, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7587397825, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5658596263, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1457684615, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5701800422, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3703046834, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7587397825, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1820705281, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5476571079, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1711057434, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1531682455, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6009917293, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.509895456, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1336937736, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5417128748, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5417128748, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.278489988, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6722683602, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.482808535, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3771310858, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6062665281, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3805371079, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7011240865, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2935973828, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6760199025, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2757185986, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7434080113, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6282512192, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1425391135, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5429166339, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4088276333, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4745035228, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3870105243, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1884239372, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5854975501, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4983370486, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4983370486, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3276434616, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2901099002, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2736604813, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2014941616, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5911912768, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2014941616, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5931139543, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3782180896, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5070819399, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5076904123, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3643413837, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1631967966, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3474927846, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6248961527, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2217994592, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6249971904, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4454843487, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.448224857, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.514391848, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4519657987, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5327944201, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2217994592, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6249971904, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5141209056, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5121650809, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6248961527, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5216428635, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4564432185, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3555531255, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5116862202, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3349461282, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3349461282, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.232197805, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.232197805, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3808585783, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3670228744, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3735326822, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5262688122, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5220875063, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3863760544, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4054892448, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3835470699, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3354067588, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1727008103, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3349461282, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1769497515, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5836240065, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2897790749, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.666311734, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4842668276, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4842668276, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6245566175, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5617057004, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4991269912, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2533654946, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6547636047, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6309937234, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6245566175, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6285229436, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6285229436, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4182671264, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2925448848, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3040559697, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6658994384, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.500271653, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4276859055, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.500271653, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.500271653, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4510059762, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4415898207, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3917642203, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6245566175, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5211563282, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6245566175, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.545972294, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.545972294, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.325832365, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2201179178, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6212521407, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5059916133, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.481359867, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.481359867, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.481359867, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4782537016, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4935153103, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4782537016, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4935153103, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4935153103, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4782537016, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4782537016, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.464633183, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5063020142, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5963099883, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5963099883, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5963099883, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5963099883, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6265140754, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5138477285, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6265140754, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6245566175, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6245566175, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6265140754, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6265140754, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6265140754, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5539920925, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2797982086, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6056889169, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4671158418, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2102369368, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5768887727, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.195647515, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5857714958, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.195647515, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5857714958, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4808578708, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5309753108, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3859677867, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2102369368, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5768887727, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.482414072, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2102369368, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5876589559, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5309753108, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5309753108, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5309753108, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4814496481, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.195647515, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5857714958, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4903188428, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4877445614, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4891106955, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4717978314, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6171472239, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4197983612, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3993213728, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5057748632, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5057748632, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5079994737, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4877445614, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0350284351, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5057748632, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3112269209, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5362380779, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3370934794, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4148097948, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4216795433, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4216795433, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3925781566, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4148097948, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4015108797, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3399572784, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4148097948, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4148097948, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4148097948, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4148097948, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4084862105, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3180540561, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3195891679, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7180407771, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7180407771, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6535469797, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6535469797, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4598446401, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2722589423, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6049790802, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.627708235, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7180407771, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3222538602, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7495871588, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.627708235, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3222538602, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7495871588, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7180407771, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1884239372, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5867968824, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.300528391, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.246778941, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7023973209, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3323684721, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3437729074, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2984899751, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2984899751, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2982854478, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3038662664, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3758304027, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3429275047, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3385645728, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3421048583, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3355517974, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3355517974, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3377353924, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3329758885, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3437729074, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4683918973, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1496284837, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5531110804, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4867393274, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4867393274, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4193494434, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3546654566, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4113467875, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5026703894, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4409598753, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5725197387, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4817075906, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4635207908, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.442353694, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2075521577, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1598051812, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6117406545, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6161305014, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.200389085, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6177327643, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.419971174, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.419971174, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1871015823, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6827304461, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5106967339, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5084170679, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2125884413, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.631489137, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2125884413, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.631489137, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5220823443, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.200389085, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6177327643, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1797645143, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.611395499, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1871015823, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6827304461, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.442104355, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3807134866, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6734021595, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4843771361, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5873831965, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4566163202, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4566163202, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3885961889, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5387502559, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1609725589, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5719181187, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5719181187, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5599655155, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5719181187, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5148079777, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6408205679, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1643286368, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5589849481, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4133673304, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4133673304, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.412067526, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.412067526, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4332508955, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4599966864, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4173344186, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4787742817, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4332508955, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4332508955, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4332508955, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4332508955, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3756494331, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.405801432, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4787742817, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2213147799, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5260789793, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1769497515, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4902785344, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1861649355, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1934301422, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1995158124, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.166056909, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1514310757, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2213147799, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4362962278, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.166174293, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4651598071, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4103552603, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1196655751, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4380729671, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.449673018, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2132673671, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1790439216, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3057729079, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3196747242, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2079331399, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3303003998, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3303003998, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2483133576, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3171844783, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1733265176, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.433431787, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4317729593, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4711738744, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4152730794, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3909799363, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3032776841, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0128700129, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3452137419, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9063898435, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5360330313, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7676864591, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5309354663, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6756014233, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4529852872, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6941474239, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.945741609, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9892952933, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7912619864, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9129058872, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.945741609, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9892952933, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4234885228, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7410180115, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4737506901, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7543919667, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4737506901, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7543919667, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.5738396575, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7983571334, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4234885228, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7410180115, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4737506901, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7543919667, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4441961115, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7565542719, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2828367157, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3781068786, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7413927279, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3791621113, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7363359547, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4454357881, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7513336774, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4814564802, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7621649609, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3088448141, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6673372116, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.546149954, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7954823724, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4454357881, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7513336774, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3363225191, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6803949683, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2404315522, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.491557141, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3477250471, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7188419868, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6392900614, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1990581597, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5898277017, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6681898018, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1990581597, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6133817758, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.438622992, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3025029866, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6057244918, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2795351131, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5735871311, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2077656967, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5495289426, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4621757042, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2206773105, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5635661737, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4727805713, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7717158158, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4063022828, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7128058031, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4063022828, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7128058031, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7689532399, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4441961115, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7565542719, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1811761075, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5900497115, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.546149954, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7954823724, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4454357881, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7513336774, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3719278006, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6470304986, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2401107946, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1992049404, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.61420972, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4300707823, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6680243275, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3335910323, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7011023633, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2565271158, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5754598856, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6423472233, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.589661355, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.752891475, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5271017465, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7749613595, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3014335252, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6287268013, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4335364472, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6878319611, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4807711312, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7032048787, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3296512955, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6234369072, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2470646796, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1862334347, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5383789355, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1862334347, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5383789355, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3296512955, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6234369072, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3207873973, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5817366082, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.476501312, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3207873973, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5817366082, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.491944035, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3207873973, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5817366082, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3231203125, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.581227569, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3231203125, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.581227569, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4872647008, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4433243834, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3231203125, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.581227569, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3665134361, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6118771029, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3665134361, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6118771029, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3556254906, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6110639215, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3556254906, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6110639215, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3485799123, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6090575372, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3587000421, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5554477618, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2559035608, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5275904014, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4085639059, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.588762387, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3485799123, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6090575372, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3485799123, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6090575372, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4100134571, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5856608401, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.373921491, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5833802647, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2498780785, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5493430788, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1709832369, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5216877938, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3527295713, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6062826429, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4261228357, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7185121839, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2799331152, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.207814497, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2595865729, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5698163692, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4015773328, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7133166401, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4625957989, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7341375357, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.291536923, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5622408942, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2900469565, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4625957989, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7494665345, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5490659904, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1772984226, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5199388279, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2314157038, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5938624588, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2169036581, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.550222184, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2311466382, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5786592585, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2371332025, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5552566234, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2371332025, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5552566234, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1998573974, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5400439571, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2265672091, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5533147878, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2330781491, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5966212933, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.328251853, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6453010665, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2124551209, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3075261697, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.605145246, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3104414356, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6413164971, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3104414356, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6368374224, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2080315523, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.548345143, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2311466382, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5814841211, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2265672091, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5465750237, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6299344655, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3060368951, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6736142285, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6299344655, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6299344655, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3423591962, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6570214418, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4798631518, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3353865118, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6803949683, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6888365053, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8656273481, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6195872176, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6299344655, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3060368951, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6736142285, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3423591962, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6570214418, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2281399714, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6211104269, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4696598006, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6299344655, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4530777804, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6935397253, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4530777804, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6935397253, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4719458928, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6691100412, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4338561264, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6652156431, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4085639059, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6786065713, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3061402336, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5870676308, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2281399714, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6211104269, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7667541011, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7667541011, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7196315267, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8835331637, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1815358071, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5527491413, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7196315267, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8835331637, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6289868867, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7818060345, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7196315267, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8835331637, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7196315267, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8835331637, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7361065922, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6026286935, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8385943307, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4807711312, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.705252762, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4451075766, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6955301379, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1624355753, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5090396684, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3075261697, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5976254558, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1508336427, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5008630256, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1508336427, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5008630256, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3622755744, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6470050798, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4246163318, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.658875652, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2927057122, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5325023222, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4550680331, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7117510257, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4490332324, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7473828748, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4194685158, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6664000695, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4938015542, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7820348786, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3226386416, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6368573349, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1712473045, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5194487191, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1285890288, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3547790816, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3942058093, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6316031412, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1771210219, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4606490637, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1771210219, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4606490637, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.546149954, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7983571334, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4676203688, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2284805641, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5972946651, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2666060348, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6007386268, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1197070057, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2335769717, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5582260843, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.395208181, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2436378319, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3631474834, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7016516454, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3631474834, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7016516454, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4335364472, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6966914158, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.6096687386, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7379288909, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1577454598, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5109149385, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3917444023, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6762795188, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2436378319, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4526810222, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7303764654, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.439316037, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.732670825, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4376912752, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7001859044, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2974295351, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6260896463, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1644914967, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.533709755, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2925712721, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5502827902, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.6349495142, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7749613595, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.6349495142, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7749613595, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.6349495142, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7749613595, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3797302349, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3902414128, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2696309579, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5695988433, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7516103468, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4598036016, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.62564013, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4338561264, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6552557413, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4811256401, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6745199185, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2503023845, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5179835315, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3208446635, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2206312064, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5852924591, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3117821952, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3117821952, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3836374069, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2936418376, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.26710324, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3114749712, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3180237107, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1663524962, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5330423529, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.224188059, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5978847447, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3500905496, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1378592993, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3954726083, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2680165156, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5455672444, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2537619201, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6052149632, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3631421561, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1882407281, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3086172473, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6217822674, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3086172473, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6217822674, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3086172473, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6217822674, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3423591962, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6803639512, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3653916977, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3411488281, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6740035137, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2281399714, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5664428061, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1992049404, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.61420972, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2335769717, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6610479564, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2335769717, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6610479564, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2337492056, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6381858968, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1946812478, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5932036831, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1990581597, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5425407306, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.5401725899, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.749744648, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6211104269, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2202940663, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6375628454, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.6026286935, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.8385943307, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.6026286935, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.8385943307, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2201224845, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6473444873, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1373727917, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4278566739, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1792334464, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.521168333, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2894318256, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5795851745, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7644556249, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2894318256, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5795851745, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2894318256, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5795851745, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2677353447, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5695294118, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5420890779, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7219273458, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1582128589, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4886015918, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5072784644, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7342525134, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1779392575, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5497069221, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5679161104, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.756473329, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5679161104, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.756473329, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1712473045, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5194487191, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2567770437, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3845708951, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6582292681, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1854382921, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5292705881, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1410752643, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1862334347, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.534851613, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1862334347, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.534851613, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4264370483, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6730449758, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4252502464, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6774296788, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1857151351, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5098093454, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4264370483, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6730449758, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1249700425, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4252502464, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6803639512, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2864868286, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5435462417, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4252502464, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6774296788, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1854382921, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5283005434, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2031374712, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.539263208, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1862334347, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.534851613, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4301823405, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2491498971, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4320304661, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4320304661, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4301823405, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3240220869, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5364140652, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4176833511, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.417865137, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4301823405, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4084622939, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3303277212, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5637799127, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3303277212, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5637799127, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4301823405, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3305712968, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5669225665, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4301823405, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4790714251, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6938678729, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4807711312, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7084427047, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4807711312, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7084427047, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.5420890779, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7268331816, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.5420890779, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7268331816, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4186091893, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6654623052, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7697646565, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4186091893, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6654623052, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4790714251, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7010793196, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.5420890779, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.7268331816, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.6526460175, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8267638445, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.6912804408, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8416888527, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.6912804408, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8416888527, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3025029866, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6057244918, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9027320256, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3386854986, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6044135819, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7663314, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2974410143, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3004205427, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.301427047, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.301427047, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3334615788, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3018990564, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2688025406, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2994207472, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2982195618, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3050638713, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5082087403, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.301427047, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.301427047, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3444107903, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2773273497, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2994207472, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.215553788, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4883739046, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2284789347, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1512514933, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3515865993, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1512514933, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3515865993, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.291536923, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5353956213, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4091031034, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6380312874, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.5650247639, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7341016751, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.450478099, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6386322493, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1813423032, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4592771215, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.450478099, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6386322493, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.6236526727, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7064310568, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4091031034, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6380312874, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3313273938, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2124108819, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2151123896, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.489675384, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1854382921, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.53544824, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1895162957, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5515559648, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.186096212, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.543850457, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.186096212, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.543850457, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1903289244, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5194565258, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1843742795, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5211412955, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1810719787, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5336233775, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.5489587651, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7425459639, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3365047447, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5791325288, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1843742795, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5211412955, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3365047447, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5791325288, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3365047447, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5791325288, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1507167626, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5080729258, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1459860809, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4458625803, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.186096212, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.543850457, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2201224845, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6156007392, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2581180322, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3118687902, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6488151565, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3118687902, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6488151565, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4454357881, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.7492834759, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1992049404, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.61420972, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3025029866, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6286065042, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2003129584, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1750913104, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4886834176, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1557396419, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3372949203, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2289493933, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6048598348, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1986505401, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6164064592, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1285890288, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4430417829, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3283378949, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1897992267, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.58491121, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.5718109192, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.798422026, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.6312184805, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.844542217, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2111187176, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6020583416, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6947687298, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6947687298, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4699250948, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2534837514, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1872867463, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5182121493, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1760120338, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1625303068, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3157594206, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1625303068, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3157594206, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2103054806, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1449563956, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2909086707, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0921413422, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.7202697993, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2589008707, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4063022828, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6789996206, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3957399456, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6505957914, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3603962611, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5998911327, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4144302433, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6439781798, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1121721904, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2757185986, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5218771219, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4174441729, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6692136096, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3981163195, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6320908835, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4174441729, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6692136096, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4441961115, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.7565542719, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4174441729, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6692136096, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1800330192, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5051819537, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4174441729, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6706681341, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3981163195, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6320908835, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4186091893, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6649304721, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.1783787546, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3984098807, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6360169585, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4557376863, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4794224895, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2744128101, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2744128101, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2989848791, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2556170391, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3292741529, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.4022000981, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6018817451, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2978808648, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5140749054, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2284805641, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5921402782, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2151123896, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5217348733, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.30376137, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5156956618, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3377499269, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1513630224, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3293749259, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1887952177, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4618333674, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3483155023, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6924946724, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2962368635, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.229077818, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.229077818, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1196655751, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.291413988, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1402577516, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3031509137, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1408591642, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2507690301, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4814564802, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7621649609, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3088448141, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7035462512, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4186091893, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.6393114196, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.180975397, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1185666012, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3311682798, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3164257178, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5851860325, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4797543511, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7571314915, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4797543511, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7571314915, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1747094296, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5403400891, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1926847964, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5436964587, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5763410052, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3060368951, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6498981441, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5763410052, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1747094296, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5818814757, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2434330428, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6275577931, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2857196256, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6431872581, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4302123694, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7142896582, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4216890914, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6885217194, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4216890914, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6885217194, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4216890914, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6885217194, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3083012996, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.658937639, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.339038739, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.674343392, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3016672853, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6331697021, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6255340042, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8724783049, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5351607208, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7900844096, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2917630084, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6143650112, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3825188992, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7407084022, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2409084436, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.546885287, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6255340042, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8724783049, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4481489512, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7745649676, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7638521786, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3851341467, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.700571373, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3954512194, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6963801389, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3347189874, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6644203375, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6991726442, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.168422147, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5314740727, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3841606547, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7278436878, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2284549324, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5849968911, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3841606547, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7278436878, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1883009511, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5190727766, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6991726442, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6991726442, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3878561122, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6673259968, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4547900039, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6556658101, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3675667566, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5884916014, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1633194828, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3506501982, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.8056920633, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8391519966, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.8020845126, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2308087289, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5837900289, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5110827761, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2757185986, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5884245636, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5950922113, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.794521228, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7122562458, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3675667566, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5700185305, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4301138301, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7140577175, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1872867463, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5160823887, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3843363396, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7719180937, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4481489512, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7745649676, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4211512495, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.688952229, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3868757399, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6607831958, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.3868757399, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6607831958, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4251436508, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6674242019, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7417101158, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7417101158, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4211512495, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6938674571, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.413689545, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6745746195, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4211512495, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.688952229, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4184379522, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6316283877, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7417101158, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3851341467, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.700571373, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3942058093, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.661919761, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5124776603, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7722874801, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5037141289, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7451862558, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5037141289, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7451862558, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3291598889, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6085546681, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2355187821, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3575980448, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6173766801, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8573900401, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6173766801, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8573900401, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6173766801, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8573900401, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6173766801, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8573900401, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6173766801, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8573900401, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4481489512, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7994721822, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3470839302, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4845766088, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7138566289, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4481489512, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.8268199262, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3915926973, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7803080345, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2243657166, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6116696997, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5512324462, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2243657166, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6116696997, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2242387051, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6366515194, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5967384019, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8544348081, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7638521786, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2516966959, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.618049194, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5967384019, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8544348081, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7211812033, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7211812033, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7246227738, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2859229126, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6102727682, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2748202507, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.581036396, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2857196256, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6934562446, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5432206405, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7121135617, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.178551493, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4966305185, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2341812326, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5587864404, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.8020845126, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4337367532, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7025336737, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3680297771, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7395804946, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2082605835, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5799650986, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7395804946, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.436648082, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2944673105, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4554141324, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7121135617, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2201224845, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6169942316, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1881846806, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5492529967, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1881846806, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5492529967, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2061735051, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5529730302, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2164431164, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5920345924, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2575547267, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7079787463, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2575547267, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7217376193, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2575547267, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7217376193, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2201224845, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6174396094, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3142765375, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3060368951, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7004749901, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4403619035, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4403619035, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4348541835, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2460917007, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.227527483, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4686711015, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2917591431, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.647761546, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1779392575, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5258943316, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.24939082, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.317716748, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6550628377, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4017666121, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1264835191, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3806304276, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3806304276, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.474140198, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4288827687, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4655976516, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.568744898, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2908402945, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5817930307, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3800213083, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5676463425, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.275874769, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5801799656, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2111187176, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5359756702, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2100190633, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5151695082, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2543881727, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3099293757, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2604066819, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.646121465, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3766019021, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7318674194, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3680088263, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7348407723, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3680088263, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7348407723, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2039051468, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6747066999, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.8131513745, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3407563026, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7443887915, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.6700420357, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.8131513745, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4909136024, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.8295116386, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3766019021, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7318674194, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.7807505268, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1926847964, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5168612893, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5084550791, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1832567181, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.572734615, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7199991365, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2821801682, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6827049751, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7246227738, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2859229126, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.6102727682, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3171094709, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7045234516, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2046592066, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5835189338, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3060368951, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6834837189, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4797543511, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.7550938398, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2031374712, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5506087731, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2031374712, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5506087731, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2046592066, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5835189338, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.7815961724, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2046592066, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5835189338, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3763693611, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6360504216, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5760406199, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5760406199, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.291702053, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6498499528, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1472821272, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4857415857, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1973212456, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4151043049, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1973212456, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4151043049, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3733543476, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.538395941, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3733543476, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.538395941, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2076357803, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4603593439, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3610544299, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.491251159, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3733543476, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.538395941, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3610544299, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.491251159, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1973212456, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4151043049, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3610544299, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.491251159, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3610544299, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.491251159, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1973212456, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4151043049, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1973212456, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4151043049, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3389148751, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5365882255, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3733543476, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.538395941, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.716402644, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3346449427, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.634420606, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2397212592, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5848344754, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.673464842, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7694606959, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5397323594, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7889494278, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6901644027, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.8578928093, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.9422733087, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4929664395, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6587225865, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4424442662, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.6752890128, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.234878114, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3593781657, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.7973233906, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3226386416, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5322085777, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3004191523, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.511038167, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2857196256, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5009118095, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2857196256, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5009118095, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2397212592, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4870782751, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3004191523, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.511038167, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2397212592, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.51111621, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2857196256, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5009118095, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3004191523, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.511038167, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3004191523, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.511038167, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.3004191523, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.511038167, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2857196256, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5009118095, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2397212592, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4848369353, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3677323079, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.227386123, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4745485866, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4245201693, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7417101158, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4614951112, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4614951112, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4848137281, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3878561122, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6213964982, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2260861492, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.5233340279, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3416198047, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6421557564, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3878561122, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6213964982, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3878561122, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6213964982, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3878561122, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.6213964982, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4713477012, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3342559214, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3851341467, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.700571373, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3239321194, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6439540126, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3239321194, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6439540126, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.5183282721, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.8243678354, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3865584077, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.7076640193, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.264489468, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6377622807, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1954721569, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5978847581, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.5183282721, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.8243678354, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2157614636, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5945881911, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.7121135617, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3753221629, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3753221629, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1926847964, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5479565965, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6506028605, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3683270402, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6506028605, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6506028605, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6532234058, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.6532234058, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1926847964, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5505445891, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3765285488, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3567823943, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2157614636, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5945881911, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6506028605, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2397212592, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6266330371, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2998634479, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4724747577, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3114222098, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5393731665, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.712860367, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.712860367, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.712860367, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.712860367, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.712860367, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.707627182, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.707627182, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4219577706, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.707627182, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3589120627, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.5425514103, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1941547274, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4150899797, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2397212592, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6266330371, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.439472155, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2039051468, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6152907875, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4030533404, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4030533404, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3490251488, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1483234281, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3321903107, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1671237023, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.8020827134, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3954512194, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6822216627, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2031374712, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.563492867, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3482207362, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5822525754, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4176359458, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1738943457, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2423357235, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.5561045459, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2165768465, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.545374294, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.159290504, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5414849269, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.257395694, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6452211052, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4909101855, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2620612021, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5135749479, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2620612021, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5135749479, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2002810762, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3719830027, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3137810587, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3956955502, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.7071407149, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3348517042, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6039857021, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2861555645, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.629918289, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3346449427, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5983196806, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3346449427, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5983196806, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2851106499, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1896152664, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3348517042, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.6474532636, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.225654013, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4590213069, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.197469407, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1754193437, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.178567602, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.184238465, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1845823368, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1774601134, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4787974949, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7133324771, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2031374712, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4583712037, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.399367423, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3981749823, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2404315522, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4283144598, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1641956652, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5508394512, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.103165898, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3117209571, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.158286605, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3448714241, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.1914846466, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2137430035, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0303722482, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.069215791, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2170093015, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0425754183, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0517368896, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3063547989, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5275640293, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2734283775, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5252214121, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1020384657, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3338115368, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1685643537, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3692644964, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2811075155, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5498581092, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0456369321, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2616350227, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0149357589, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0810610775, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0443048673, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2080697434, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0963294095, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3503787449, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0886097347, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.317800436, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0348634322, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1089893663, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0418110563, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1263106239, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0591853085, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0469519414, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2737524838, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0660966747, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2619720934, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2281521745, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4897338475, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1507980396, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4306039129, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.143845919, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3069337163, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2288990189, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4893390144, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2149649942, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4621452071, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0429472468, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2682743438, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0096249742, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0731825569, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0434204746, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2884095691, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0510978078, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.274537215, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1907438007, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.405665851, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0110997268, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0110997268, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2003172673, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0484688544, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2058585557, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2518167303, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2802085844, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4608753441, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1866863138, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4241639401, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2048583359, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4687358059, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1924813832, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3799051443, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2191271005, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4602679886, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2346058703, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0125273573, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2731486445, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1497462775, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.328844008, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2238148768, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.52493701, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2284908571, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2284908571, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2891210904, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0569456532, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2987097798, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.296584784, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2227417005, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4532692581, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2267034081, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5112287501, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2144604484, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4889405222, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2100117369, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4234939311, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1819297585, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4599679269, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0240192783, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2257355657, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.006232911, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0631716867, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0693838888, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3541078046, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1312294598, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3219448107, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1066668272, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3346290149, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0260011372, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0354718138, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2123055601, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0415150576, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0290204019, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.1482911337, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1036775249, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2702781181, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2574763992, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4616305811, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2142946982, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.484261245, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1218936373, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3759566083, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1892697158, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4931453714, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.129389671, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4720138889, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0218136876, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.1715150637, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0046635316, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.072625336, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0374013003, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2739588122, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0985948811, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2593923911, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2019894892, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3485822104, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0402793442, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2381051263, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0688899279, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2874483621, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1090055907, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2863243515, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0658474433, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3081739317, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2856210698, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4749518447, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2500514007, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4683806074, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1631196073, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3502730667, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2128683656, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4505523201, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2213838544, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.487123838, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0213957216, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1902977181, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0311262012, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0159701445, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0692984783, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3018519404, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0565852318, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.2754316847, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2266948695, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4484451942, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0805429873, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.214785954, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0115605955, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1527216185, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3256028392, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.2588416866, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2861961627, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5098631492, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2243415229, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4627772335, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0736808908, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4145261311, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1789284639, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4708819562, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1712189785, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4638766967, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0584747355, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3024184964, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0123705378, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0666032113, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0983109394, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.332038665, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1118711613, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3088693307, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0991600948, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3032928217, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2200119658, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0509575856, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.221568509, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0945369837, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0042252851, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0861677526, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2894688066, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2668026105, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4519949729, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1767006175, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3924531036, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1995980199, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4244503391, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.182163624, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.365248326, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1661921872, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3683990147, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.1132241561, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0831928796, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0838367669, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.285532969, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0081047737, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0765130065, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0947870559, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.332932324, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0202507342, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.1835106225, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0352454709, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.1574417443, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1197620936, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2700475913, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0583563868, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2603466066, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1874040134, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4759508032, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1852976304, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4741269561, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0914255554, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3137170777, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1490232165, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4374583572, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.160001999, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3869887663, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2727622868, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.005606295, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0666224509, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.1275223683, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1079317537, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2966061781, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1405710589, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3028381427, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0252094156, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.1448020883, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0233208431, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.1414772143, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0047636231, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0748592801, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0262417467, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0498147751, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3099723998, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2624276421, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4883161005, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2697134918, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4954790401, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1168960024, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.382583012, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1980953584, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4475393504, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1616527688, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4808720402, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0437677394, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2439168896, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0047185573, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0801930435, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0561465399, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2648532379, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1235182482, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3906003942, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1363531958, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.285043283, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0220842517, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0220842517, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0512722229, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2192562967, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0073271669, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0988123964, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1240384045, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3036786152, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.273072085, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4904647237, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2733762612, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5386988476, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2036219587, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4504603916, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2092735109, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4123228453, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2451360144, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.508428521, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0588529545, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2979167122, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.006488743, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0566797332, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0420931384, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2691340677, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0473166675, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2637166055, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0607008885, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2584364365, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2290266995, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1914995421, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.064676465, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.237464716, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0582139914, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2556606248, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0610530907, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3130095936, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2135664969, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4243725762, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1875512348, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4299642052, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0567548917, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3098329822, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1445983407, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4652483976, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1652457579, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4729546491, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0654404234, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0564177217, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1470714641, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0505775644, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2645559846, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1334687879, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3080913467, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1054433514, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2840946642, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0607157585, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2149299083, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0187785885, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1394190482, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0056498244, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0938459963, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0425754183, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0517943191, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0480257139, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2428610297, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2635610838, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4764002973, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2815971367, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5252125986, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1738582449, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4016171441, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1612067625, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3934823211, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.23217334, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4674701274, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0636777092, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0061022531, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0861449065, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0505279112, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2524478809, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0598904672, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2852233544, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1276861358, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3279857505, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.106540946, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0455895279, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2502391728, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0591528553, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0105704997, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.1100673444, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0948600032, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3563185492, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2529913063, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5047314299, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1915104466, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4810197054, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1572052717, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4715103006, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1853793533, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4783932142, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2049970131, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4818709113, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2655991688, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2134984128, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2720484662, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1150958266, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2567415289, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1613698788, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3362692075, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0963090937, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2559618634, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0792417823, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2206258448, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0546877772, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2495519218, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0952757937, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0691791024, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3356486042, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2700569574, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4456029881, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.193191197, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4018622995, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2195372587, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3664303672, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1752436791, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3908643085, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.160280284, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4076009931, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0470882896, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2519506261, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0188079928, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0887797546, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0643784088, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2657614115, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.099792895, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3005938292, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1323003964, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3269392904, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1404951244, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0400339669, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2107947844, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1158891123, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2382700917, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0824606497, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2456619929, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.055997729, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3184365228, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3010169295, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4860193118, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.227786487, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4462012248, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1494730177, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3093381902, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3028759029, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5604725286, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2477319247, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4193163673, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1274094829, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0047128976, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0689675963, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0507961674, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3159375405, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0315345429, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.19644459, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1754417668, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3246583081, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0214301384, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0214301384, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0836983143, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1345807078, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3002738097, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1014523463, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3610324631, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3149975099, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4828711196, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2066923483, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3954821804, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1955903221, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4098213379, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1541796876, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3752947981, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1332678166, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3502365985, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0579512984, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2548598507, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0413032999, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0410103561, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2740873282, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0107119071, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0937480994, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0919930687, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2216385417, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0118173655, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0859545184, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0106164205, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1084362918, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0054781817, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1026914283, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0405996505, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0518518764, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0893859254, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2237243845, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2334922961, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4473828787, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2565364021, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4508053903, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1220164275, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3602457832, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1107058214, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3732245062, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1506918326, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4027702518, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.047451031, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2751988338, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0398422901, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.090461222, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1049798505, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3553686272, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0733032385, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3393411295, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0608998726, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2933161563, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1984290178, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2713368245, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0843038995, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.041514055, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0528092675, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2937198065, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2743982463, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5150965594, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2413362099, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5119321954, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2024418415, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3564333494, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2674824194, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4950459975, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1712189785, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4511162476, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0979617281, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.010814656, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0896887156, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2679540691, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1130748559, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.305973853, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1439182616, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3239832814, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1377491334, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0700055493, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2193270198, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1002207815, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2543427312, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0487016069, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2290700852, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1045073168, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3739493975, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.219732521, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4151239791, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1911102136, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4171914075, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1599102698, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3236465325, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1668854639, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4201032138, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2384674586, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4770811353, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.04614982, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2712671882, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.0513525446, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1081824845, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3258308765, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0653324229, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2979115054, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1002795509, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3650503322, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0344468041, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2016040236, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2378472129, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0203182774, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0866184263, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2474248849, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0455183602, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2398899448, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4539938567, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2021755466, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4899248083, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.128534435, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.378165641, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2009118875, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4869109445, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.245519933, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4695982872, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0444778924, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3119344119, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0051763115, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0674000282, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2452462471, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1434671524, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2981447907, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1599866587, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3568133322, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0860048847, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.1193385531, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0753458701, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0460601148, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.050779728, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0441548949, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.050779728, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2916500734, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5172529356, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1907614927, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4483545139, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2402463216, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4371716158, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2250808927, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4850615114, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1518847562, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4050868632, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0695131216, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.1147291388, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0484266907, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2491388629, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2561794438, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3141794893, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.1786034621, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.219706802, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0482517074, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2469647405, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0188016877, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.0762075915, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.0352971252, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1810420276, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4087926657, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1393212733, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3737850641, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1307706549, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3664151599, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0984296906, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3288790321, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0968035845, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3901340721, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2599817969, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0043338295, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.0866871651, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0826692156, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2792157437, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0260644718, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2021979459, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4267163836, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0292482903, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.1718027364, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0476686206, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2043794633, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0333632833, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.1957772365, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0419638675, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0516224122, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3080928418, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.521203636, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.246503534, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4563344162, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1404420507, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3871221051, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2718214516, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5260701844, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2349880762, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4876552343, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.144160887, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0191292829, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0771102798, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.095797182, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2903102744, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1485710335, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2912399572, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1655878456, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4099467658, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0178653211, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.1312157781, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0548969121, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2349479309, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2243243411, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.0727546786, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1461429566, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3552926382, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1949241563, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3964264383, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2096494314, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4676462124, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1406721418, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3683127018, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2615379682, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4670896512, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1643287178, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3743841843, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0436714032, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2591903536, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0098375035, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.0738163457, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0403934833, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2660562052, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1762631528, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3402055672, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.093376234, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2555179847, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0413018965, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1738508875, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0383901088, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2122934293, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0847450577, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2538320173, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0446034445, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0509460551, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0557104213, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2342703476, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3065894951, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5157122184, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3193100501, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.516229686, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1795747407, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3714895661, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.178788465, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4805877836, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1604142113, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4821009867, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0253491429, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1947459822, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0218884643, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0688019442, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0740309998, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2530589697, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0287757396, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1188922611, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2723958945, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0597343957, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2091057996, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0313361855, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.1568404935, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0103535779, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.137434861, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0869662189, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2942577141, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1409492798, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3211348684, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1913921001, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3999036632, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1616610225, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3131370146, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1483400534, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3650996904, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1973045428, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.406023375, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2090819521, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4247713769, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0634917625, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0664319693, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0896838936, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2606554809, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0550893151, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2517305147, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1101341452, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2718590268, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2171221595, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2399710397, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0543849763, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2248303115, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.0146584245, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0737286333, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3076094266, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2277105248, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3945218249, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1849339578, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4386240114, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2035242833, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4163814361, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1520832336, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3073898582, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2398212278, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.43125723, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1238816671, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.0019267823, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2729231212, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1416008317, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4208681078, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.158735027, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.371630162, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0322523474, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1866934109, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2212361705, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1324277813, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0370694586, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1071484624, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2371273413, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4737847575, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2092398642, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.49694188, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2221834521, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5319675596, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2466031325, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4750802403, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2302979641, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.495072574, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0357371651, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2636286371, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0088084825, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0817237537, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0278553148, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2743064672, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0735396847, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3230969898, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1046814649, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3592910044, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2108920708, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.0886246137, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0636134095, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2360613388, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0349628947, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.0833394775, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2642890053, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2009233548, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4134068926, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1567782617, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3771851946, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0559239605, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.194570149, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2336503952, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4255679123, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2192750674, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4315395376, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.1373600644, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.0063131313, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3270101704, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1544845218, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3359460432, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1283209434, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3205905925, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1296377204, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0643152071, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2486934518, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0513717905, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2179007768, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0483983086, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.164469708, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1688821793, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1556988827, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3716955853, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2140902773, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4268434108, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1752646162, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3887795637, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2084320046, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4218737616, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2244110812, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4354495413, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.0925065499, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.0604106676, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0497892159, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2697504713, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1357565806, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2864016238, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1121544277, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3103754668, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1098852828, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1047151755, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0822696915, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1569688569, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0519676719, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2165364343, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2092735109, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3903841357, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2034555666, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3922452261, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1872830229, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3677267744, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.139635594, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3585616231, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.2089993825, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4145758839, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0419105676, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2747808393, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0784631911, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1161358149, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2960371404, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0872069809, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3394300387, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1018074137, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3572856396, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0619429596, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2317557084, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0351761217, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.1716149092, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.0713051265, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0583085961, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2475028907, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0855743103, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3075931534, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2648534428, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4992683394, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.197568112, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4789887224, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1022601551, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4059787886, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.177706864, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4814065752, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1659966019, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4490603861, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2265283804, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0600444334, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2456391015, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0439808547, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2975413849, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0754178467, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2491006352, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.069287831, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2822280485, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0179012416, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1967518753, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0320831755, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1187504034, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0063225854, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.062962223, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0466104561, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0512257032, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1649184592, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.254904859, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.4731974812, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.2005019818, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.359908515, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0717602059, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.298641858, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1241730096, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3444733696, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0998599842, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2895701381, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0869027177, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2881002271, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0155261784, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0914007624, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0922545051, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2532020629, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0445055496, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2445466887, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1528247417, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3332497403, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0629974647, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0714205178, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.215597624, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0546201639, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1059992243, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1982965798, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2079661542, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4053550763, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0318478781, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0169991214, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1808548946, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.362107025, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1761718207, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3491313268, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1999254993, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.342454263, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1722961461, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0712445709, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1936425342, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3526225099, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1171973324, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4023449435, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1341030107, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3942932268, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1162549058, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3649888938, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1162549058, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3649888938, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2423945859, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3206913232, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4851465943, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6051693241, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.088526818, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3583179111, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4703961163, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6298835481, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5920893212, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6925021521, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2247861386, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4434810102, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4026159305, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5712560131, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2296660763, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3916051273, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0777132402, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2813748455, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.1836870498, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.351911487, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5181825847, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2452267248, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.173281748, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3178268798, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1715979984, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1715979984, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2990226216, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4323734153, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4321864613, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5429193884, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2334787867, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4421282786, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5843055591, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4626955907, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4687264136, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1043436098, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3012789661, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1724871568, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4004356524, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4225757837, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5948022736, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1518079712, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3505288268, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1383531711, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1634384231, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3986641525, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5676965183, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3315037522, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4681978795, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2003825042, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4389344981, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2003825042, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4389344981, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4604743092, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6213537795, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4310453013, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5857650291, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3082962363, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4448728848, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5834549494, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5834549494, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5676965183, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5834549494, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1577724878, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4141338365, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0031727701, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5834549494, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2387493522, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4641140867, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2221813073, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3992935625, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1464697791, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3483313798, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1464697791, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3620367958, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3194331635, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5031092446, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4060466978, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5425760821, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2225900275, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4094746714, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5831913487, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4217112372, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5884961897, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3344224182, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4757708606, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.448290781, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5498272118, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4180999217, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5354721595, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3786410843, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0246742426, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2190234056, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4390667168, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2305720745, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4655848022, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2653870605, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4982627379, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1095117028, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2749574297, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1122890322, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3610235246, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2327384158, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4961897168, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4569234875, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6188845588, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0958342736, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4027284446, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4547912444, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5872444902, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4036650481, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5969793476, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3488611534, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5550499651, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3188347709, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5510450101, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3280859435, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5416930398, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0063561686, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0382369567, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3199809704, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2049841563, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4155916631, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1516107499, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3796830006, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0932787065, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3735036942, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0932787065, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3735036942, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0775706901, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.325316121, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3611133026, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6289392047, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2445648179, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5331675363, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6607380946, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.263859373, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.493136819, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2216899203, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5236896612, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2722704374, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5960046549, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2779440823, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4935559299, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2071195621, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4163963688, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0100890204, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1027994704, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3569840484, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4006636128, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.502033185, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1867971035, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.387645732, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1353358401, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3949315197, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1353488993, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3910024453, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2826204057, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5043062353, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4329476703, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.580496734, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3714562234, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3633055454, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5680915938, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3633055454, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5680915938, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2958899407, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5527117669, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4673235341, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6059276585, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4348120146, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6115466078, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1799729111, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3492017592, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0626608371, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.365655272, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4882803186, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.1848560896, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2181288141, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.359834606, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2442523002, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.121373607, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3023621415, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1367498403, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3943841419, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3808654814, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4893838264, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2245414774, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3890858187, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.517430129, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4488802815, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5347582737, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5676006715, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6880701449, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2974074485, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5121581248, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4547912444, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5884440852, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2043800828, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0101628465, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2194796, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3226457009, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.302668138, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4926594955, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2458691816, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4658595745, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3319782561, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3319782561, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2307308545, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4414208765, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5449210172, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0158957663, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4321864613, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5402913319, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4488802815, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5896924236, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4406612885, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5676112113, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4476950425, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5932980209, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4723213638, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6260769804, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1171973324, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.311874117, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.1483315516, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2524905159, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3855845079, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.9025232868, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9169897591, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.9234732619, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9472986864, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.9709835434, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9951728991, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.9154051169, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9757471795, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.9154051169, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9757471795, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.488843684, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8291158209, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.8935248372, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9404428602, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3461378924, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4933032319, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2103967388, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3872019296, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3541947137, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3559047315, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1787931, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2568045428, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3282410732, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4364543653, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.37151025, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4321864613, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5369715394, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.5492014937, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5685465223, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.6099084961, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6580157605, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2464380579, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4278399264, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2699951685, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4217192984, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2292375927, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4513453412, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.1879604202, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1195661522, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3305337714, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3063009808, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5061964101, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3395693621, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.144945687, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2628972098, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.144945687, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2628972098, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.118230532, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2461592106, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0846356642, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1696081888, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0918412218, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2022483081, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4955056755, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6304896504, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5038374192, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6024265864, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.349172668, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4946434088, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2291612345, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4192305797, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2687127529, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4315501661, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1806752162, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0358676701, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1039393833, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3386489806, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1677697491, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3991833623, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2255686073, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4747086049, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.089507234, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3316894207, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1501390718, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3069388977, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2364723597, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4165096947, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3456747067, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5098918117, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2231193155, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4067965564, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5347497636, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3772017211, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.528124643, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4266291185, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5800596652, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3942032669, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6371076305, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3183355088, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5053098374, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0578213638, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0305017438, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1935279285, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.392586452, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3362681996, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.553122652, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2544967446, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4480540982, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1191221548, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2787265121, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1191221548, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2787265121, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1866594844, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4437597553, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4644593897, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5796009654, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.1927932675, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5004894768, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6103735934, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4903430689, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5365812499, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4867027459, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6717971788, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4173721558, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5043502593, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4843150499, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5578850048, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3374197535, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0668043314, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2919280798, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4076170046, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3228858966, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4495802767, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.331257034, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4544266148, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.193978105, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2199026614, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.240885627, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3796021685, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4872335402, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6075898036, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2344087667, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4317853842, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5396321095, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.47967645, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5540737713, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4387483291, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5882858749, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3270207866, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2093407743, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4409531972, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0829831794, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2573581929, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0067692805, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3546571364, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4911561718, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2174185304, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4000689216, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2274490671, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1146077373, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.206370637, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1146077373, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.206370637, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2053322383, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3692051451, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4798870805, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1909471507, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4946630567, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6169269421, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4245848005, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5212978747, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2839224283, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5447934366, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2164429824, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3963800929, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1804323992, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.280050662, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1765752259, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0013316837, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1619294034, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2536107728, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1035597811, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3008852578, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1654225968, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2697583215, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.087002234, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2360294412, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0870914517, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2298185733, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.307338019, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3701729258, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4863138218, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1727855587, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4407883468, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5281354273, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2945667423, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3820111377, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3484819265, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5640398262, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2834052291, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3513608621, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2607117486, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3452976012, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1805838104, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0080371909, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0996020674, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2368009901, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2309552735, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4513778136, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2831988282, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1055680583, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1053163126, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0896659226, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1564967798, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3589732342, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4090747564, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1029034865, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1660861683, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.457393858, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6041597508, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4488802815, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5304323628, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3944883435, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5955979871, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3800609413, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4952333573, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3807835188, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.529917206, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2037157303, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0845164802, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1919704826, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3465066145, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3064478583, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5424888572, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2187751288, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4684349995, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1385105945, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2961104285, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1385105945, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2961104285, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3001327916, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3729157998, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3688020573, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4388306821, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1819660468, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4298470783, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5723546698, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4000262679, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4958139678, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3644752843, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5303078856, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4057053535, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.512899989, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4574297382, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5652380319, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1754880586, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3605361466, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.037882802, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1842670876, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2863266617, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1945786955, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4234025088, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1759696285, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.409890054, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2097002018, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3587926376, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2738643931, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.424851736, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1827241149, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3161007019, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.6288402959, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.7096134366, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1742198634, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3604224246, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.510477915, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6193632914, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.4631700687, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5656836355, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.5368572661, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6191297829, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.5246859683, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.6168947392, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3757861732, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.5516093877, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1065368874, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3550283417, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.0075630509, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.3245592827, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.4961612244, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1122890322, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2944127383, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.147226754, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2884679034, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0894073036, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2683339864, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0795871931, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2564312712, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.2155565135, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3623226384, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5115662303, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.1862366831, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4478710143, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5290749755, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4407883468, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5398405651, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3325507241, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4074972494, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3537239926, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4415325921, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.4284626897, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5332275837, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0061376874, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.1738335057, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1815433909, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3244528801, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2436419423, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4803275525, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2542828012, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4695941026, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1449700554, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3443731766, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1449700554, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3443731766, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3328114847, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4458341777, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3754361563, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.517558668, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2864399965, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4183741456, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5788593227, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.5227583694, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.658086832, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3876366843, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4978835095, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.4302440011, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5419412911, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.3968427845, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.5690871427, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1433180486, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3550333935, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.0080178579, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0988536232, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2922887729, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2188392829, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4686200098, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1965928456, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3439604956, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2607825013, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2618919103, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2181288141, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3090525767, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3492507318, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5496225091, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2249784741, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4532607979, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.6057637452, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.4913251088, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.5226059543, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0775706901, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3493795476, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3054859925, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4679798467, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1537112056, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3277135849, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2331637025, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4272786682, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.01479001, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1352102459, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.3209694091, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3232764602, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5431013661, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.5046613015, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.637796962, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1786486639, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4318546655, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1810425767, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4009339188, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.5037566723, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.688705973, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.4334785461, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6277016493, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3830039705, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.4237613813, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.5866233346, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.5594129512, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6536638088, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.5639943531, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.6640560919, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.6878626651, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.8027840472, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.5885017791, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.7371195244, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2572812063, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4712370054, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.0093441292, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.2507010004, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4191447532, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1995129794, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3959122807, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2032621337, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4211311972, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1296602059, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4080786466, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3249929186, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.302668138, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4321096866, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3484636843, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4951272293, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2749866192, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.3146587198, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4839658797, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2983588345, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4730509519, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.4096636841, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.5278686169, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2904047194, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4617994566, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.239898222, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.411144763, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1765985771, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3722080737, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.1648414046, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2118120365, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.4245081341, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2255468433, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3946833869, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1289068007, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1839892716, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1586510484, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0801399249, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1552012947, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0830820562, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.156017965, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1153430137, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4347773475, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.576341381, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.4417179753, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5530863244, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3002781435, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4842037101, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.208817295, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3442652042, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.134818788, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2007978949, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3413615261, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.1447062686, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.2566358039, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.2738379692, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4878379588, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1444027027, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3829771215, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2071380877, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2071380877, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1691287327, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4587620544, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.4569234875, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6188845588, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2203595851, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.4955056755, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6373668823, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.4049493948, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5523097163, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1786486639, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.4085144223, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.4333488015, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.5965589158, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.5004894768, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.6363587895, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0062450169, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.0097435637, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3174589148, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1486070692, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2876054438, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1667112121, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3091312551, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1619294034, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2773561971, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.171852621, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2956663669, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1716931386, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3193195681, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2860639863, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3809088476, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.0080761379, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.4174908454, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.532629667, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.307695001, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3660673946, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1945429094, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4056377906, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2036529001, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4327934811, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1356590733, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.283480642, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.0080957533, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1247552881, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2362382406, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0891712295, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3647616198, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2045527518, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4781573576, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2443399085, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2022525118, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.241990611, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.430837102, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3561794559, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5928040084, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.1801664301, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.5627168455, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6692849204, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.518456549, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.6742153914, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3390409145, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5149735242, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3074762345, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5504296088, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.4897516268, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.656493231, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0078111767, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.0097559692, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2635162917, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1240861632, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3652145198, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2280725846, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0900779003, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2403353486, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.1971628211, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2217146309, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3251763396, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4533778049, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2598901307, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4315532958, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4869755956, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.4440750606, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4901489106, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3442087652, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.5068918436, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.3146150051, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4233526729, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1402342404, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.243775938, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.1890037708, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.0046935712, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2331624324, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2056660017, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3332179943, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1894523533, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3443950901, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1402739529, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1542051915, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1006788152, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.339471961, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.5910744763, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6719182395, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1826047865, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.4946630567, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6169269421, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.5795328348, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.6571878614, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2426376379, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4583407227, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3201886645, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4142777373, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2735838425, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4313737146, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.0078479587, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.0081154642, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1722630701, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2929617403, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1146077373, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3630389603, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1581734376, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2985579612, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1799218761, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1763189606, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1602999169, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1461012977, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1171954274, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.5176576778, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.6613069296, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.6510651028, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.7441675184, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3114855789, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3867464805, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.368818981, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4691915859, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.3580995277, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.4302234255, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0098738411, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.046579169, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1117535423, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3298241714, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.164461102, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3379763603, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.168322547, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3417273532, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.1663768232, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2598332227, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.2543269102, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4565797935, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3487616463, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4903432663, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2337773425, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.463900136, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6066709784, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.5563610897, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.6234143353, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3203505804, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.5201747872, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1836719686, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3652875097, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.3489571331, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4539166206, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2684337672, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.1642384866, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.4097157364, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.4592265081, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0711399045, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2671857672, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1567864815, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1556051571, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1556051571, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0980286251, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1801811095, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0942924728, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1779374253, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0592866628, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1386716777, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.3961554468, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.5208357533, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0980286251, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1878238308, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1414355019, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.3460029263, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.087470156, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0925292191, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1727205518, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1506688384, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0596357066, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2115339554, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.172815092, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4697967033, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4102495209, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.689626048, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.072091174, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2485455674, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.072091174, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2485455674, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1380164294, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0527836624, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1367093374, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.4951225397, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.695156541, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.5067058202, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.7186203369, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.3537581251, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5377035719, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0061527937, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2738643931, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.5091945154, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0062763757, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0060049973, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3363699446, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3314824344, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4714509113, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2097257149, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3958940712, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1484131243, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3702567901, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1484131243, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3702567901, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1667887222, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3815615866, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2312892591, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.429642013, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1508271374, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.39659117, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2627913769, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.476022074, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1892847543, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4916060436, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2194042939, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4343280867, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3300025916, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5052501973, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.167728933, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3631993115, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2327184905, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4478078222, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1824401863, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3670943319, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3377854699, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5212012299, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1743141732, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2946006717, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1247584612, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2782334073, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2102861073, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2077061257, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1413464157, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2294891986, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1022763759, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2639843034, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1032298579, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2449112248, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1760042942, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2712560799, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.212684447, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3229997134, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1475503034, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2210410894, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2491127461, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3603818787, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2555886019, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3615321421, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1659072309, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3048601436, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1008516756, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2383121505, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1754374453, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2820101696, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1511056744, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3452827307, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3032787241, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4980421354, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1308672244, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3175036485, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1308672244, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3175036485, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1323764586, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3818322536, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1953226561, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3705900176, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1393754204, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3894719474, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1609112383, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3479090205, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1201739663, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3145128189, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1815423566, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3906877818, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1670157087, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4021286881, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1706885783, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4225990442, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1248955867, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3412708226, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2938313992, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.157997836, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3949243938, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1250361463, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3600940511, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1278739555, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3375274254, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1362877036, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3557485349, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1362877036, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3557485349, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1318131343, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3175812088, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1057536542, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.311219701, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1187311958, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2738621723, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.316692053, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2662775445, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3375384369, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1463197333, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3593717322, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1486872033, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3323435432, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1180985863, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3213619214, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0101767053, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1362877036, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3124983185, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2701175927, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4427599081, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3996254547, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4245413015, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4137283876, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3911236938, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3817455147, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3685731278, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2529968293, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4798320133, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2252434881, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4468141977, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2202248274, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4847496568, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4581393811, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2519921894, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5094822089, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4046788061, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.1593344703, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2249495262, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4760660342, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2808927299, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1432651349, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4034278533, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1190001244, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2764563186, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1190001244, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2764563186, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1382944607, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3205933835, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1081441008, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2688233391, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1311040994, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2967415176, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2495169225, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.542794239, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1835715309, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4205224654, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.165216918, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4134512022, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1236664408, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3765134278, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1493734218, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3978589591, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2808463393, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2962222, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1971903602, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3626964653, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2663224082, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4670767909, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.182941171, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4383387745, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1806102343, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4007053924, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.175046302, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3839125808, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1709246775, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4340281227, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1773054312, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.404813142, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1602717706, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3907258279, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3857801012, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3917239471, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2286041446, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4733113101, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1720067347, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3994831855, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1821474812, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4214655348, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1655485713, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4116209605, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1055322557, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.1763116501, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1773054312, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4201842845, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2538799032, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4061799424, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2029840717, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4273763309, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.1903260815, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2078396213, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3829871599, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1715579786, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.389678321, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1066975938, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3168512125, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.365576402, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0022163121, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1755819961, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4133497901, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2431884859, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5013433181, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2759106085, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4112997823, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1143643336, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3176453743, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1378490621, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3161105982, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3882967156, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4287492505, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1562623181, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.291871279, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1511319465, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2834306935, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1511319465, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2834306935, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.153253165, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2756316952, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1536066468, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2802368315, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2040828288, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2778060655, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.28517971, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3210853624, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2830695024, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1562623181, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2831829304, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1536066468, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2898716122, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1406363056, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2453152046, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3264287329, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4166244317, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1360265255, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3002035244, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2139709913, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3568171393, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1551566862, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3182263053, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1551566862, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3182263053, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1413464157, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.30785711, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2166646699, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3532993718, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1461700142, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2791654843, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1806102343, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3684591961, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0290265664, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1565899484, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3084004707, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1616505795, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3517221063, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1645494395, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3395039485, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1762505703, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2840831395, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0124589603, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2005358365, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3585550644, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2425078966, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4412765873, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.229897139, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4576466768, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.153130508, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3836419456, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.153130508, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3836419456, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2218343729, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.469051775, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2327080491, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4435738303, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1674413496, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3646163104, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1743771229, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4689350277, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1580869433, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3620582209, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1508931842, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4354703981, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3931382365, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5429286386, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2147829756, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4454092411, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1606012235, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3962176891, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0072371553, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2223392282, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4675027108, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2835511313, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.276972506, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2136187658, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2033571258, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2258578256, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1190636584, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.110205107, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2753348108, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3163430447, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2462954619, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2551232415, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2356239773, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2390985318, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0062494471, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1713179346, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.187238603, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3744699637, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3238973847, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1284866897, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3510128773, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1284866897, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3510128773, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1361658548, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3295167856, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1205331006, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3171578306, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1173534476, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2211996191, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2575337905, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4253117788, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3043567522, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1281982504, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3651532899, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2174376922, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4131100936, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1547142813, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3797208554, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1322148042, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3008688617, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1191456217, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3639931709, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1302352098, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3260351347, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1283205561, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2392667579, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3769302868, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1581578341, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2990712208, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1581578341, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2990712208, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3791177762, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3370625924, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.348481362, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3767372262, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3371166726, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3284649069, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3397876135, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1562623181, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3835008462, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1485542687, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3526199874, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0096280076, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2024746974, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4418847146, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2762822898, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2494209435, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.7065161304, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.8047179188, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2353716486, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6897992635, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.664271838, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7768492312, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.7660237942, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.8523393041, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1221286555, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3283024639, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2168828306, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4479129165, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0922567176, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2523418211, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0917508468, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2502292163, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1423256407, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3890910518, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2834052291, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4463699833, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1680901633, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3578360182, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3420291338, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5175802067, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2189330439, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2479798472, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4497423075, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3144351519, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4709516979, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2557186722, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4214364635, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0997564897, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3173713993, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1531067285, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3863552232, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5712128724, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1406259844, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3170195854, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2112174445, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3711587615, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1729748623, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1729748623, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1584499089, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3420386248, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.212432413, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3866454944, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1200869963, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2890949021, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2932961954, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3509216686, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1357521816, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2572585481, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2045516327, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3580560102, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2210312846, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2381424916, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1168213031, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1296602059, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2735600297, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1094974142, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3143619843, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.120309212, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2935108999, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0346648674, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0346648674, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2136628331, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.17681988, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3160912868, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1167008545, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2600678712, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3128510454, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4986402374, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1027375699, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3189374533, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.213093175, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3438625961, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2912425895, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.440415904, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.274106345, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4591309102, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1047180098, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3002812465, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0994331257, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.308380941, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.20416354, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3020070871, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1931611179, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2023612696, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3258121781, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1283205561, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2209901152, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1283205561, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2209901152, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1221762491, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2260792485, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1242416606, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1843602934, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0856863573, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2159174722, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1809496049, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2213733761, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1445549391, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2604577257, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1335123432, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2109747878, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1535686541, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2865954536, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1258273119, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.235212285, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1222932913, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2790886522, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3015846611, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.145800301, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2202030567, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2387054424, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3038971866, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1027704436, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1124196921, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1221762491, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2594914718, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1226659433, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2503423204, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.117588068, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.196380369, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1226659433, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2146038322, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1945429094, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2850090374, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.274106345, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.318652853, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.2387054424, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3040028144, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.1722232256, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.2422343661, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1950495147, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.1195584858, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"bleu", - "score":0.242140936, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_from", - "metric":"chrf", - "score":0.3066737552, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3366844235, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5178614849, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1708106136, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3645499017, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1701648662, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3815871239, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1701648662, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3815871239, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1773054312, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3932130356, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1667887222, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3637613573, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.1616505795, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.3755941714, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3999374158, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5786384525, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.319436209, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3061191299, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.5089658824, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2566614541, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4282484209, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.3492520394, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4895757696, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.162673926, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4029875964, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.0121856802, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"bleu", - "score":0.2848759498, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_from", - "metric":"chrf", - "score":0.4793282151, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1863040568, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3913852085, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3615889762, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1474542551, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3266271798, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1474542551, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3266271798, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1307524498, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3361579715, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1623790818, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3670808373, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1275724716, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2807962809, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.13574363, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3517512874, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2819192243, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2577701687, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4440871284, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2088929028, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4127473132, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.1956833643, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3996176422, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.2124570425, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.3820763688, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.2066657943, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"bleu", - "score":0.247226482, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_from", - "metric":"chrf", - "score":0.4413120951, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2249502221, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4223099671, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2058881573, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4194446199, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.222084029, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4070863716, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.222084029, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4070863716, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.175046302, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4226395738, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.224697344, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.430588468, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.1146038414, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.2956164497, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2175549422, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4124786355, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2032648426, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4113882971, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2966887335, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4543969785, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3300025916, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4884860392, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.3300025916, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4884860392, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2324568797, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4433373371, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.0737873045, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"bleu", - "score":0.2147829756, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_from", - "metric":"chrf", - "score":0.4618896398, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1383690338, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2826680631, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1358896975, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3523239133, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1160961779, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3030210544, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1160961779, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3030210544, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1159507116, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2361346034, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1109232564, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3045281034, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1228979883, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3280398584, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1631849581, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2996949856, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.163979069, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3610632772, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1900096922, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4748534635, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1421433745, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.36091593, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1221762491, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.3477174082, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1227598323, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2619861329, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.1258094133, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.2553947244, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"bleu", - "score":0.3251236519, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_from", - "metric":"chrf", - "score":0.4957568395, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.21222721, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2775686236, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1315376613, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3028123601, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1315376613, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3119958542, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2815763683, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1645494395, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3212878805, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.2069099661, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3685394321, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.295785178, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1340616912, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2770773336, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.138082965, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.3721998912, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2602720291, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1266637216, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2850381295, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1383690338, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.308816836, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2181762689, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"bleu", - "score":0.1609112383, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_from", - "metric":"chrf", - "score":0.2968312568, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2298797475, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4413223405, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2175549422, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4362387654, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1858042935, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3794437279, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1886418209, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3794437279, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1457751612, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3555305489, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1761368775, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3951933819, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1318131343, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3918044047, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.3621795145, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.551454372, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2131110797, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4388024026, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2567411255, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4331602231, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.2684500838, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4949662669, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.382945316, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.5336098994, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1360028792, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.3236348308, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.0063565537, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"bleu", - "score":0.1421938964, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_from", - "metric":"chrf", - "score":0.4229437429, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1322148042, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3123314141, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1287668952, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3034375835, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2118964985, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2551309002, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1331440297, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2603808074, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1223510768, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2316964345, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2160836611, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2219463108, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2586080895, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.1981444273, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3102637354, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3395721872, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.1331440297, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.2653676233, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.15479055, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"bleu", - "score":0.179704006, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_from", - "metric":"chrf", - "score":0.3168437607, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.2590721086, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3549586016, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1828540487, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3023902804, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1736086198, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2743074384, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1736086198, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2743074384, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1341063965, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2766307218, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1300986845, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2842871175, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1077448901, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2061208528, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1502250211, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3291575381, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1315376613, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3012532961, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.3466123639, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.4602193169, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.166558336, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3065906312, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.1586668325, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.3074056285, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1696945358, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.1553358687, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"bleu", - "score":0.162911928, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_from", - "metric":"chrf", - "score":0.2800592178, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3351318043, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5017887941, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.2329216409, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4807364087, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.333238591, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.333238591, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1269051898, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3450402349, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.155334391, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3666802859, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1048730309, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3411413947, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1792939676, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4629429664, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1602382805, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4268341897, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1660551995, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.4509175931, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1453056699, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3996703801, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3810271038, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5487840153, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.1580433751, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.3469496559, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.2533911498, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"bleu", - "score":0.3713354961, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_from", - "metric":"chrf", - "score":0.5550866337, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1602717706, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3978173363, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1540463229, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3934040018, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.246766761, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.246766761, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1463197333, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3917791418, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1816430579, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4299219126, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1062948022, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2893247453, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2327080491, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4453208003, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3391544707, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2577701687, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4782520457, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.2086872196, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.4287494866, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1394842, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3744296786, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.2766362617, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.1271801603, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"bleu", - "score":0.1760042942, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_from", - "metric":"chrf", - "score":0.3699002946, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2387386324, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1560665245, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.386769736, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0884201903, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2702544959, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0884201903, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2702544959, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1502250211, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3581568895, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2012788514, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4158992612, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1028131261, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.2831556428, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.1717286307, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4414945899, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.3427050698, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.256963082, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4638113965, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.3110277299, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4544814135, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2764560856, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.4775117409, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0929691776, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.29970256, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.1514798525, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"bleu", - "score":0.2108528803, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_from", - "metric":"chrf", - "score":0.449596688, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2647482712, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1362877036, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3046429128, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.268507896, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.268507896, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0566217058, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.206635514, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.083351125, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1757222237, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0474357178, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.1254074321, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.157997836, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3478409814, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.017418423, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1342816455, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2947742083, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1996812739, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3882998251, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.1986162691, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.3882998251, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2268580622, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.0908357042, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"bleu", - "score":0.0834058287, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_from", - "metric":"chrf", - "score":0.2437536104, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1269270754, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3091914499, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2933171392, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2629115376, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2637699112, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1182518861, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3091914499, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1404678995, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2962148769, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2235024225, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2812642832, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2167661288, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3338227785, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.268979816, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1161008302, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2862219875, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.2951535845, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.0533840079, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"bleu", - "score":0.1506922896, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_from", - "metric":"chrf", - "score":0.3780369017, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.1382590514, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2325663165, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.2225647445, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0275588782, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0275588782, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1053914097, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0817079143, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0586191125, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1120947801, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1555770025, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.027312532, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1612982609, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.15080393, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0275588782, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1476996786, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.0200359258, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_from", - "metric":"chrf", - "score":0.1494957761, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0138000672, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.2727444239, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4767475273, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2866968424, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2283980372, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1070460489, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2839466003, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1080439968, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.294634966, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.0232133895, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1822595523, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.4400405225, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.023406525, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1486872033, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3185175816, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.1657462416, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3990312722, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3672664653, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.2378843103, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.1744167679, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"bleu", - "score":0.110471112, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_from", - "metric":"chrf", - "score":0.3405217871, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4824454361, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7294391806, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5745954681, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7920051188, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.473743611, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7204787094, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.473743611, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7212488881, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6012475604, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7990339789, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5825014144, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7832709524, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5293493443, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7338751119, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.593861122, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8079474862, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6407610564, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7997703698, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.666067774, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8293798371, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5718247506, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7570613393, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5718247506, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7570613393, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5934447342, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8057808261, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6241924128, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8031006154, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.637250211, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8187019875, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3504650671, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3985617531, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3572514591, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4031231976, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3673594704, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3973031067, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2940872474, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.371820954, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2996868226, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3355531728, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3704616278, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4166020708, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1945002964, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2766236141, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4317270148, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4476891052, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3186925263, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3608935627, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4199243021, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4310330651, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3814608517, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4003026958, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3625867508, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3828423819, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.314699984, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3609768424, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2613520653, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2929743883, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3887651247, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4134287679, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8562379115, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9148801473, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.708662669, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8167266342, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6537803976, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7742226744, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9878765474, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9958930218, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9577952806, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.984767538, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7382380644, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.863773877, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3831856821, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6625830409, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3560124706, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6528728847, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3155065747, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5938531598, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3172449687, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6080661572, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3535276145, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6399338911, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3290938553, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6587606187, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3489208531, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6505040272, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4202165847, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7002995338, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4142150748, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6886174347, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2979376341, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5878658443, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2737856703, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.609144179, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2737856703, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.609144179, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2831940853, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6293179947, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2060740184, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5566122985, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.376414574, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.660406351, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.6688950612, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7856645014, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5724622291, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6818279156, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4211686428, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5788959328, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3472652234, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5363235029, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.543980353, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6575989222, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.6910600271, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7855543052, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3051409552, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5227460341, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.7311321553, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8118306465, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.7618275371, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.825286078, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5447800851, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6845859708, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.6345704535, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7601399913, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.6515663614, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.768509508, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5435307013, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6465767616, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2747017431, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4456826256, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4834220367, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6788626715, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3842600771, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6030559478, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.267623232, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5440246804, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2559102159, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5013387365, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.258869207, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.501809735, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2328598164, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4660475399, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3215063503, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5479695584, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2002461106, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4509998021, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3648808361, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5811650865, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3187601848, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5884644304, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.324998939, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5532261012, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3140083019, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5436299116, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3104399268, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.539023495, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.217329685, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4683342449, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1800381353, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4276066829, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2702404891, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5059487428, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3856260937, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6500036127, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3765213224, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6469521425, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3854316215, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6356972129, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3854316215, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6356972129, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3624746661, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6011484151, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3037425321, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5893368096, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4161637851, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6576322812, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4326013853, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6609703937, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3510442823, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6071559885, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.407992699, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6592699047, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.260756525, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5605305671, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3099487893, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6006061483, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3201334027, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6222205234, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1333978635, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4677868984, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2602768294, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5310567542, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3792935336, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.604683163, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4421973227, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6193429426, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2291350627, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4939257941, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2300624325, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5109587983, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4185267451, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6035836276, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4717494805, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6205798682, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3875008478, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5621267917, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4839792902, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6380327835, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.569053507, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6944016439, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4330560284, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6068335863, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3769643783, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5617832488, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4160129572, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5905243302, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3175167305, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5599612274, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1810501939, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4154005352, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5018386916, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6673891539, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6832136298, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7617777911, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6638859619, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7874224591, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5298074527, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6947127142, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5298074527, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6947127142, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6543739381, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7768522459, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6623997922, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7735365396, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6225849493, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7743614552, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6699094721, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8022876242, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6967404588, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8042365592, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.588648912, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7611944709, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6561309661, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7849652413, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6563682117, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7849957664, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5513991165, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7476990274, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2431197693, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5332455437, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5821415139, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7329539843, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4766240788, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5978297795, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4845228, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.596805047, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4376770823, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5832672216, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4376770823, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5832672216, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4494703452, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5696298539, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5361224072, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6206824469, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4004369616, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5499753932, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.449813089, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6151723374, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4469067872, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6070649357, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4295014616, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5957510679, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4772740424, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6081867526, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4561327125, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6079134952, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2932156666, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4784943256, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0165604899, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1132379771, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4124136267, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5714981156, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3529111374, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6466347967, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4726941433, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7451099574, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3316233172, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6272179443, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4139457403, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6639608785, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4216321717, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6897801156, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2948270649, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6191657517, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4377505013, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6684596427, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.603601931, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7801644742, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5022206886, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7105763508, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4324907328, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6444897357, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4154129291, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.643723328, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4847783844, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6873592112, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2755378501, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6144463222, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2797994281, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5926090215, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2995846559, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5994048238, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4026333612, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6561295628, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4143449479, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.673656943, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2463870511, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5790960837, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2463870511, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5790960837, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2043019546, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5336103119, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.460215944, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.156264376, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4715421309, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7046296108, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4775743055, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7017340115, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3818762105, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6423162802, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3491792142, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6341002242, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3467761224, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6340001931, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2631288868, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.548964367, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0017531557, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1934804829, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5498004622, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3725685851, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.694405807, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3720001389, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7013845085, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2553027433, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6370427509, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2553027433, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6370427509, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3649036595, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6887265942, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3616219381, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7227161818, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1853380378, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5623323442, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4058364744, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7590590042, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4608790143, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7574945544, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3349016716, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6738850346, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4547549844, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7890162768, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4547549844, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7890162768, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4099467567, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7134834639, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.0014100395, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3341557927, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6767920817, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4000115178, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6786441872, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4494597917, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7073438158, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2893234036, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6127615086, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2893234036, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6127615086, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3503640149, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6426566938, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4754775746, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7412539061, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4254054052, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7419806831, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5119365924, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7671481459, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4696902393, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7315431192, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4662543919, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7058896648, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4997575473, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7306601419, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3862844443, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6747509427, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1731432715, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5307830563, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4290760508, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6942504376, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3001925558, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4986988949, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3268845395, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5177343511, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3014338594, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4642558926, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3024007598, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4633715711, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3293368889, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4868090313, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.309054287, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5103110435, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2868006357, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4509415605, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4592260218, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6081527521, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3446713174, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5204675443, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3597572114, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5404525494, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3276986983, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.470178979, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3249152568, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.477688125, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4618548402, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5927663766, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2483029971, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3968882034, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3195089197, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4896643256, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2806454735, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5180716872, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2598777183, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5891629073, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1645647767, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4128543592, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1665598655, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4124447085, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3036094747, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5533394965, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3720337795, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5959145386, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1533428946, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4257635311, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3182748866, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6082918459, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3516027504, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6195701585, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1429693649, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4755038138, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4096506623, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.649236506, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4066581265, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6336046295, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1401694296, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4272307712, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1760794779, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4575853717, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3340339327, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.565679543, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2192609696, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4167523578, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1592287655, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.392054529, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2701435097, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4745339489, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2701435097, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4745339489, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2975272141, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5014416568, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2251933632, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4830824236, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1608238101, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4142991984, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2946154489, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.520909149, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1314079838, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3808902516, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2606567287, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4890257121, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2703464256, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4887431069, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2564158056, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4985422503, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.236221005, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4430018401, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0900128129, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2967810564, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0709787993, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3721953236, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1047947717, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.489652006, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1061903685, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4840210376, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1821138708, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4986662704, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1821138708, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.496627096, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1667579458, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4319174283, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0804182297, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3905413317, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1067619625, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4217035289, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1137285511, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5442956479, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1040922995, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5230723703, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1383466628, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5224463124, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1260228462, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5260100533, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0982158039, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5241292206, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0755916752, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4397873567, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0019936204, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3966243116, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4243281568, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6929325034, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.484016843, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7080111416, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3833719966, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6131504489, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3479593282, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6085432842, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4860845406, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6654842087, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3959836986, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6372978936, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1324340637, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5138012834, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7611872893, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4338915749, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6814623138, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4043183357, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6726559802, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5245557812, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7584833861, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5245557812, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7584833861, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4089601472, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6783188537, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0535286908, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.381954689, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6360111898, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.276430338, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5419234868, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2605601, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5367621571, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0980629789, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3903932428, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0959650718, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.387961208, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1864224228, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4691166437, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3560731744, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5863868434, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2462844971, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5007787043, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2926638003, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5719277381, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2560601538, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5528416138, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2883192773, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5811195806, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1137999186, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4351192402, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3683865525, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.622976126, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2028908092, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5022073517, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.0020798669, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0876518186, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4198399937, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2082930999, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5532091848, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3481883244, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6021958119, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2758130765, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.555386594, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3223396024, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5912894027, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3146657216, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5835370043, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3515801944, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6120838595, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1613389652, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5552482282, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4278408686, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6882160381, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3859192215, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.658279417, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3507011049, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6303302921, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3086175864, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6190092441, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3576059082, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6266553981, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1816363816, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5268292197, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1247824427, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.360678603, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2869154405, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5724031955, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3214836778, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6050096649, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3962150993, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.661579107, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3461149674, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6080288193, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3266611081, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5894586069, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2480974841, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5410362169, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2093922424, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.536274568, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.1910176196, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3448409302, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6395426496, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.348309625, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6318122441, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3480615932, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6310588996, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1329195574, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5202656846, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3310309191, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6237034632, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2076781156, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5422928733, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.0012236907, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3700647909, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6502447446, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2952766338, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.301420233, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.308431879, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.348679197, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2333206164, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2566419801, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2405665303, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2761116321, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2495236752, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2609799308, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2130826774, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2601354884, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.172301598, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2190209939, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2071210961, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2716500133, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4013796238, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3867568552, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3893349932, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3929514837, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4198465413, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4220024963, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.445782016, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4413641988, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2400005785, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.267896582, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1163190656, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2557855807, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2727073772, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2405856208, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2719774363, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2305738879, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2872206315, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1808733422, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1808733422, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2316754904, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2711134955, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1892200388, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2384225593, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1459772707, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2327510553, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2572612647, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2938008219, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2170018433, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2425396354, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.216410352, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2441782822, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2164921332, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2412402757, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2265279671, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2764063117, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.158089056, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2097214753, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1234039753, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2044445386, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1961148618, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2607156802, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3661665378, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6186956524, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.38784545, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6551636736, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4684056503, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6820263032, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4684056503, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6820263032, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3634216548, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6210552995, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3600088669, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6231275718, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2357207794, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5451532107, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3883340374, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6469273692, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3907955113, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6489080989, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3691590047, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.63634035, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2492904494, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5801222491, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3438759684, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6178241857, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3567821216, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6144568171, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2423520401, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5229173241, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2561386634, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5426654213, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2968684307, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5965916756, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3635008401, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6256665663, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2789283308, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5934703247, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2931172961, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5995777718, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2058570298, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5580925589, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2182685971, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5755949065, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2198075098, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5624240513, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2484556279, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5720910327, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3148545033, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6192770324, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2970503087, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5980643974, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3293744591, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.621734126, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3296849443, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6225198705, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2701732725, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5963262713, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.0018463811, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2191909414, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5995081066, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2760129269, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4796094092, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.310949331, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4906885571, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1492411396, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3993127431, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1608791791, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4188174294, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3297812291, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5164501196, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3790340178, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5755612587, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1752611208, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4183562973, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.4316819878, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5878046852, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2729927321, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.477037078, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3527260474, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5246522558, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1776418682, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4643539241, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.315014891, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5091327701, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2281330715, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4503946901, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.0304107029, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3554259248, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.54607273, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3609839854, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6437289665, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3833596038, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6303767331, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2787847531, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5553047982, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2725539427, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5601834885, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4114155282, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6302831368, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4935048463, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6943423485, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1515895761, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4190363051, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4620212794, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6929628328, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4134846608, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6553595923, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4215292636, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6613648438, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3860341167, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6493990798, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3859703894, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6451087675, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3627829136, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5991830268, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0014492754, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3088416771, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5929008789, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5486141288, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6319028691, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5350553356, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6061404962, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3896845294, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5335919787, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3316280826, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.484108334, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3812595799, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5540174, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2818356183, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4873620919, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3027621928, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4761465803, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5487552983, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6792265965, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5508944416, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6588533619, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4935985545, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5839815052, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1959068559, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5086260671, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5746911772, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6684658929, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3281583484, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4266174575, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1585410271, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2981695175, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5077054905, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6413587198, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1405908234, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3681067484, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1611183722, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3897870969, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0663880802, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3558829662, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0635704651, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3538942716, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0989917658, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3565436123, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1903819104, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4467804501, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.105515377, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3506843953, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1965846863, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4328743583, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1284335757, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4173634055, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1448369994, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3906065103, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2881123155, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0845250805, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3436527523, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1488938388, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3891856763, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.000709824, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0785950789, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3479385838, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2907774922, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5054867927, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2994581307, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5652964318, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2827954146, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4985216049, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2854020995, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5032170837, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2887273871, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5546188228, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3128156976, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5919269832, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2624046909, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5428010726, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3728454915, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6659031226, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3320217594, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6192339182, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3024784802, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6011904529, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.141979371, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5124141579, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3165543225, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6093384141, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1534684069, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4338689861, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0016212711, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2727086653, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5856254576, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3012954123, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5580271496, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2170322998, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.531352232, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1910848554, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4433063858, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2055691816, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4403283744, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1156423806, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3946570546, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1296430335, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3075780604, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0450732266, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3072344834, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.4703094052, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.63131306, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.4268698427, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.6231228373, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0962617119, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4030384335, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3040281644, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.557011361, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3055356654, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.541441418, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0663449009, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3933989157, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0616470534, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1554907346, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4319476007, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4088183572, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6176764064, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4047612859, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5819091, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.314338998, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5302700213, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2500141194, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4962715087, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3219984327, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.541054894, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3581458342, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5653762619, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2036645387, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.5772621757, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6977660021, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4597577036, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6387649358, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2906050918, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5466988554, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2813982099, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5330166411, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2813982099, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5330166411, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.398736934, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5966252341, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.146297827, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3702441703, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3225135832, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5152627703, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1643795275, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5226815529, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2376599226, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5552803049, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0747522735, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3917102663, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0759105307, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3680248117, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0042064141, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1162416628, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0795168782, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1785438178, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2316746108, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.580510262, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.229202938, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5302965637, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1782141139, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5052627255, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2442398001, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5580259395, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1972611941, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5278567053, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3544044522, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0019685039, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.193863826, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5282523989, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3209133858, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5100662436, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3540078977, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5545213531, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2118766389, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.436511399, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1995171046, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4153129741, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1175684385, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1358346534, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.160329685, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.37078357, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5946653727, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3656717313, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5646486569, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3455814845, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5585506843, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3193002633, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5301066308, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1112359545, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3100651532, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0618350336, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.233390833, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4578141566, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3057302575, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6305034409, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2882291032, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6087031937, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4235901905, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6897643314, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4235901905, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6897643314, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5011893046, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7089203665, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.544344184, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7408492383, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.409628428, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6241258962, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4818632112, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7050536783, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3231928393, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6353582763, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3406014428, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.651454868, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4492327787, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6917786881, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4492327787, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6917786881, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4682583024, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.709053282, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5105553787, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.445713314, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6723505987, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3652139786, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3824205406, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4094748015, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4288513206, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3613816887, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3747448803, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3613816887, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3747448803, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3543037003, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3864890532, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2387702718, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3046917254, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2013754379, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2744903534, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.570227161, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.577208812, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4054283524, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4160855105, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3740560438, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4097585581, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3835611536, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4136043954, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4416093606, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4514750994, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3513670909, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3757759666, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1933336173, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2805662059, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.354165237, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3873954624, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1866741142, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4659033002, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1695069845, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4866898418, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1435764594, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4291039159, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0776207564, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3650474475, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2351665048, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.488505273, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2561279176, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5381058353, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1343270651, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3620549501, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3063252015, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5904333378, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2379983204, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5579014807, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2347703724, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5165217514, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.271198171, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5555651822, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2788268041, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5738319953, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1642430432, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4701596261, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1687770271, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4368481166, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.22415591, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4998179193, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4310064928, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6681893438, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4527112326, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.670898987, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.465608068, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6768276246, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.465608068, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6768276246, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4032823351, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6319223068, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4319870164, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6357518564, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4008289024, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.619515937, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4748655857, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6916379663, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4194404959, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6621110612, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4423448287, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6617260327, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4655412009, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6735988738, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.465085908, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6778737063, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5018812162, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6982877049, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3746293079, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6297969107, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4523633372, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6557435747, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.521658108, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7189203937, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3977038259, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6202897864, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5071615323, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6902107811, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5071615323, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6902107811, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5024073849, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6805608954, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5105445285, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7006788698, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4375567656, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.631435717, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5531306492, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7508908078, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4834225009, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6678984764, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4198435179, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6615330487, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4423392582, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6633703485, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4857904515, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6855885711, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4650185344, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6620634443, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4229886329, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6260112467, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.422714343, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6266965858, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2729012184, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4275664216, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3167585644, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.507686984, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1485909701, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3792046025, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1491315854, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.366133112, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3292454551, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2817018331, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5332946673, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1037736178, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3387746189, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.0907398033, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4022599112, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6108631094, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2575102349, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4697665795, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3212983212, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5599573621, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4018590955, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6025771205, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.0898114892, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2560040743, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0923688347, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3472719366, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5201554059, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6912283535, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4411478183, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6241365711, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5525047617, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6971891435, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5525047617, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6971891435, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4286794451, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6365023289, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4740627791, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6744300843, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3531331255, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5770478823, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.481497339, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6355577992, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5280706683, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7101124584, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4744991305, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6720481842, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4946489713, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6635756951, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4946489713, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6635756951, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4999208084, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6982198149, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3234542278, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.565290538, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4734249555, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6791725069, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2548334123, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4565768361, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3542266509, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5643413029, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0798787471, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3626462425, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.113658747, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3589839129, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1828245612, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4754066124, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3634148418, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6061487576, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1991260766, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4079321426, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3721154325, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6214976186, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2998257683, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5433673039, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2921982022, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.52641662, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3142825719, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5843538976, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3721154325, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6246670079, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0607723401, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3407473281, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1747302897, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4004250724, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4767709962, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6259826462, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3995439803, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6021193793, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5428215192, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6623001914, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5428215192, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6623001914, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.406561839, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5890799945, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5703676204, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6860261633, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4148283786, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6168104641, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4995271502, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6422528647, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5142542955, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6424880376, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5285470049, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6459593469, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4500257217, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6204580993, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5050700247, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6475387595, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3614492694, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5766912416, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2787520741, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5095968929, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5576102994, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6640761861, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1651024006, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3792784923, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2993081269, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.477774296, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0816483251, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3152419985, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.079305616, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3127076148, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.123400578, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3331532513, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2533658571, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4526653761, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0857608867, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3280524714, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4695168707, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6115882472, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4488093388, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5788970821, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.319619172, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4758634858, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3095674063, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4984720192, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1670991646, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4262476444, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.078021673, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3168167738, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0874867177, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0125004762, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1238327101, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3882322279, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5684042821, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3531289422, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5483853809, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.451478785, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5848017729, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5084875082, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6086126309, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5148124488, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6443063242, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3731480984, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5483607295, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1954564368, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4554299243, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.6009332869, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7201156007, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.422018422, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5864023473, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.6427952895, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7611062227, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5908781325, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7135251492, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4051294289, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6289236919, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4267442072, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5873661332, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3202249301, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5240877864, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3021474642, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4948871858, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2589941365, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5932208557, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3473313423, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6495220842, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4431139444, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.685704628, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4404610867, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6852276536, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1560571823, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4855990297, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1862321334, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5434259794, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1292819544, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4539578151, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.453738261, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6984640606, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5813201988, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7732878389, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4836134349, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7036055458, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.382488832, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6879676788, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4685867885, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7063293525, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2161144776, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5783999378, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.1382852021, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1943642066, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5437845507, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3315962079, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6420436747, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3319181497, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6296213701, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3644356128, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6333838792, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3644356128, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6333838792, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3239007562, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6320480882, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3645504394, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.64602226, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.233007365, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.56517708, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3728937116, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6577808114, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3859055776, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6651384368, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3668099117, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6472192231, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2912353795, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6107975281, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2912353795, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6107975281, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2132671218, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5636781797, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2493518765, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5378176061, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3199241797, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6151079711, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4876819889, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6502930112, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5145500337, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6710712793, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4465062606, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6393035001, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4465062606, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6393035001, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6152720493, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7135410085, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5631686113, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7184482394, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4545770467, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6181560715, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.600592056, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7065044125, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5848425045, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6948793399, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6505785903, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7498687329, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5099789059, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6591589669, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5274166052, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6781556869, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3248172849, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5086455218, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5609895347, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.681370247, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2500271341, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3785374221, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2942715677, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3867492388, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2921999208, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4387549485, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2977681359, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4349893265, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2923799211, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3727508207, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.129672172, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2760408327, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1837175088, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2588050117, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3995850754, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.508756357, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.067066745, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2609736646, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.282562585, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4403352185, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0814983556, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.228698086, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3730523468, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5149547593, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4188415745, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4486815117, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1239416924, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1983362537, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1767139752, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2956531698, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3920110588, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4224062857, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0560612491, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2966788497, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1361675359, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0505953041, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3965392443, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1265666538, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4038727424, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.076952541, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3675548829, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2243899628, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5106660073, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2041188644, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5209095485, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1727336938, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4962992067, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4033612274, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3514306358, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1125396528, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3312806076, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2523482006, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4410174464, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3095017642, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5048955319, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1173344637, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3700951717, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0604025945, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1864421846, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.17878417, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4302346069, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3896656594, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5661203321, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1446787739, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4125068266, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3820277264, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5663085006, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3422256854, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5722446403, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4215265842, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6140840595, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1882906075, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4750608804, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3470953143, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.512413747, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0813654713, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3675681587, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0081523917, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1288598477, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0848296457, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3705955245, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2282403145, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5807113513, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3534880761, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6311980121, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1846217209, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5452524689, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1846217209, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5452524689, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.068294034, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1478699653, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4453044958, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3149469319, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1337736598, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5270242776, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2472957584, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5673652711, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1073759565, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4590576572, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2261757041, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5681537359, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2920161125, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.586127589, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1610086717, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5252563866, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3548850735, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1786879144, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4923350572, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4597295133, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5915321093, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1806974227, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3482690261, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5236428394, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3482690261, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5236428394, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3896357749, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5711687057, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3990118477, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5638068824, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0830886515, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4154783518, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5523079444, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4560256554, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5819378877, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.361466948, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5217871952, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4062130996, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5705677722, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3785700741, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5432976559, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4197402258, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5789182839, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1685104861, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3926922642, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3519323937, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5556135973, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2529362973, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4763301335, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2387616111, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5060111681, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1099631745, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4562725637, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0628313651, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3571654598, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2320768115, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5542533872, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3681328025, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5589462319, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1610181648, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4440198047, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.448885738, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6217229022, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3721427288, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5776707489, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3685432686, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6081703722, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3727416517, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.556253816, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.5270835406, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6545175153, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1463099542, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4820045462, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0135286021, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.1839498679, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2677388259, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5587479208, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3124200382, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5563618146, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3355271325, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5622995574, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1350251422, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1318723172, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2453793855, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4929351232, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3340915684, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5881616165, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2231805576, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4839952646, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.13831235, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3735362786, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.619955729, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1304410207, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4371703942, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6644363101, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.5116998504, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6764649728, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1413352773, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4869689368, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1488503723, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3683017468, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1391044164, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1974371441, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6726680111, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2935398429, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6951381337, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1859329553, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.631265189, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.196988755, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6426381622, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1250254952, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5134519177, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1307849908, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5671925387, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.1611436859, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3138115023, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6729359212, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2762254294, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6512210578, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2485715476, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6619189738, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2443332859, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5746305891, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2863192243, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6564670371, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0964537814, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5692397578, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4609236579, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.253232599, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.634050238, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1643888714, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1552450511, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1689634884, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.184184846, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2146050139, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2491614164, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1133562624, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1938403365, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1298713855, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1885296553, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2907480532, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3256819926, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2941832965, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2902230142, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.21156471, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3764522334, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3811591131, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2802334144, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3051135603, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1936886643, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2507668706, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1191782938, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1612268034, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0915897145, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1604651736, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.23258136, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2968944499, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2196687819, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2853191119, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.238500021, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3189153082, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2332550586, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3221663487, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2243394826, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2821830229, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1563935126, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2473109072, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.128606125, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2214367565, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2221235627, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2906383282, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.082209595, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1824247101, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2078787665, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2756656982, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.220677136, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2933989965, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2286976241, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2991217929, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2509281474, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3278628963, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1715121044, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2107529339, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.289382195, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2167171226, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4510971286, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1906820165, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4726429207, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1840222131, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4631133991, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1840222131, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4631133991, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1832966985, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4594348688, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2167171226, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4673219674, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1225677725, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3888459546, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2169620287, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4542389366, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2181668162, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4653734296, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.222954993, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4776623789, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.222954993, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4823001774, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2181668162, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4688447561, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1906820165, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4764825215, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.052213612, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3400818525, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1703756775, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4461042775, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1862014063, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5607456809, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.378631625, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6635410443, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2196114713, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5737658144, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2141579644, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5842832527, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1972918019, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5692505098, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2055897037, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5814353568, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.142409791, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4730976332, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1949122053, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5624690189, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2588604689, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6034516114, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3413326582, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6366815218, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3800346951, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6452882639, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3783339819, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6593521342, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2688635993, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5762551633, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0698131466, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4083625992, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2174421311, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5984930471, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.4275132191, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.6183948028, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3384715911, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5853748389, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2707674447, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.494047093, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2707674447, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.494047093, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2270708175, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4862454682, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2128686476, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5101291767, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2128709461, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5097666837, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1988963683, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4442470563, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3094522455, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5630983761, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2318174546, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4951093505, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2403887065, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4991655088, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3830336678, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5620304431, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2112396309, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5078608171, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2128686476, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5101291767, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3252422367, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5722293207, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.211110883, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4027988647, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0998605829, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3687157022, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1663169311, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3915983161, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0696414571, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3249164702, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0727643305, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.321161366, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2330817485, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2221855207, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.445074868, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2702057908, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4678766242, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1769916336, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4185787405, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0955343712, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3595876505, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3118241997, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1245054566, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3479769018, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0459019971, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1702227105, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3935747186, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3790620537, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5725673261, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3660196411, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5845337385, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3645571064, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5144301079, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3645571064, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5144301079, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1812076974, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4487884877, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1883530449, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4304723289, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2357204508, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4656429911, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4609248607, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6626661413, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4174698824, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6502382958, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.538744282, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6904491114, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4282802116, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6473023221, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4526263247, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6652966172, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0703435502, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3516259272, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0667231966, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2955579945, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2316834412, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5068903585, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1330961609, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4502513659, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0872277849, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3364641575, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1476568105, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3849224617, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3775112601, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1186406395, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4500029014, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1868832039, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5004399872, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0517284328, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3142433455, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2472151143, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5442406939, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2718532633, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5585854392, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2959455735, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5713837604, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2168805396, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.506252536, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2073783805, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4984632492, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3252087252, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2861595665, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1235794498, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4078633867, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0519226945, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3186059151, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0783823186, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3561023398, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0355853226, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2801274743, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0454303441, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3455689507, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0048954756, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.108791208, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1036966012, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3325279132, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0548781427, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.282759158, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1839647698, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4671696314, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.185657203, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4755242092, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1623190728, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4612755575, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1510126214, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4308753906, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1693306015, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.442736392, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3134098737, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0679967534, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0999760385, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3427128418, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3404484092, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3095271693, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.050197822, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3726436019, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2897115086, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1389171241, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0429897354, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3035138538, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1200764997, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.5840778022, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.7188523563, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.5258041464, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.7156057074, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.088510343, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3542044128, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.141801777, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4442326904, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3561981736, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5123206369, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0685512539, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3194983347, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0283968509, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2233695139, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.402078841, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3117704018, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4919255848, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3724642668, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5209584151, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3262468942, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4858600082, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3262468942, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4858600082, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3725023982, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.512216193, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3669823181, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5161342211, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.1512297572, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.383796897, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5441603162, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3683384333, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5353541957, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3747706572, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.520911792, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3049239316, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4954261476, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3642849608, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5223164971, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2402463216, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4527249312, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1031071355, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4087956994, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1572052717, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3752206868, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1225899828, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5014302476, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1598423262, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4759652107, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0526688585, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3551300147, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0571917804, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3600549295, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1058560062, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0784731852, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.138517213, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2764596646, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5766041891, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1165138975, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4750693558, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1046807503, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4004016785, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2981795569, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5420613612, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2999813281, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5482034618, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2717321002, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0382808667, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0673146215, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3947663332, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1813466966, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4176673378, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.153620195, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3943316917, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0833358065, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0759565169, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0696244153, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0035612536, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0025237298, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.4755605012, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.6011398608, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3048688484, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.423110719, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1520434987, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3544354828, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2582643227, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4622766761, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2130807529, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4585809667, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1249829152, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.123122675, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2944327586, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6021903435, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7189230568, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6837528315, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.796878989, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5810419951, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7223623051, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5810419951, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7223623051, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.439168416, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6371098202, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4063427008, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6422753362, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5124564256, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6584075129, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7191192065, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7900451518, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.645705467, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7698170823, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7555875294, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8049022687, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6443411341, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7335999563, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6178921921, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7038448765, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5127683744, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6392337104, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.228536965, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4750387664, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5975003598, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7683913391, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.188779623, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2360941227, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3593909828, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1700831187, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.27468331, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1700831187, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.27468331, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1273192736, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2223196142, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1280769531, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2077034261, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1138070635, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1874120296, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3487145359, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4856442516, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1628360068, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.274359209, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3360376952, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3529764045, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2168721879, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3565912503, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2652905483, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3682977697, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0955413803, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.101783917, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1454906008, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2205462076, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.121068786, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3192454013, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2364905318, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4127382175, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1414434097, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.139205063, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2392792151, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3886781036, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2235625288, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3697725657, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1578901416, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1269046174, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3259738911, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4954841707, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2971168749, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4617842176, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3410136463, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5758572581, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2026639469, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4471011187, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2826834683, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4501358343, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2319385727, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3940880854, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1162232342, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1082669441, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1800487821, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3772586334, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6297960259, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7117676662, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5701358971, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6801332691, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4820227549, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6179256582, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4820227549, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6179256582, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3493356358, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4827709278, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3165483199, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4908122137, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3145581712, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4688436985, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.394781294, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5373384618, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5701358971, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6801332691, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4692880638, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5773610755, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5796814084, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6364369549, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4632588853, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5787305109, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4438274412, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.52386826, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2985280444, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5072627289, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4940219502, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5838214856, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.374755902, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5491788682, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2130536898, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4371748198, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1517019713, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3872481255, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1682934919, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.451564263, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0891995195, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2986174009, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.141046542, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.395660515, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.1020614051, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4176763689, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6124700717, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4321664312, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6410028391, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3879155257, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5723637874, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4305675865, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.63125083, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4305675865, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.63125083, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.004789272, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0119734565, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3002149853, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5378189161, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2623806582, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2087690008, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3981381071, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2178236786, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2135544528, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1582263259, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0947765738, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.298513575, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1086652236, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3211814423, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3184011333, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4757795896, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1840870717, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3935933505, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3530704023, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5215303819, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2157485457, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4194032371, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3361543946, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5097369506, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1441526878, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0588540978, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1724001922, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2342589159, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.387724069, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5570859362, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3791776666, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.536579445, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3166333841, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4824025636, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3166333841, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4824025636, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2332914593, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.442914754, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2422764842, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4614682757, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.167208803, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3830062024, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4097762807, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5623921018, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5197186862, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6387638037, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.306263798, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5077543267, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3886170745, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5432656354, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4014604107, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5559363995, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3092470769, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4978251801, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1770633309, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4047932836, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.309041043, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4867705634, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.329735821, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5062241575, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.322130529, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4866081657, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0553784778, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2899958464, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0553784778, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2899958464, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1056380936, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2323275602, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0754574024, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.207199644, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0795410773, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2990326103, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4592557039, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6121399519, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4926928485, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6783058706, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.378184476, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5516941276, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3459197398, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5197016246, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3016434352, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4694223787, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.112207907, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3598119302, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1002099771, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.1632777804, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2447019277, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4583472828, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6077585259, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7400152007, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6260375038, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7803415401, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5078162248, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6905875293, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5078162248, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6905875293, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2961648174, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5022745285, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4214420672, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6448871869, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2973155467, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4888827116, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5803184115, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7598708285, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6359088668, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7818086764, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3744682, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.596599571, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4723708689, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6521003934, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4723708689, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6521003934, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4311779921, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.605767675, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.3186701835, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5261433842, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7092550338, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2511746528, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3146726147, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4709531556, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1541396341, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1541396341, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1397878244, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1518242214, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0754393839, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1621827389, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1898569805, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3803223838, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3000233133, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4363867386, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3223419048, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5205977846, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1764046492, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3464061249, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1550323329, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0843539602, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2005359552, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1885679994, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2046670174, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3025868321, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4033294752, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6228862505, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4489843852, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6143783255, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2512754001, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4828406182, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.309168597, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5135112084, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3688091032, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5618587772, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3586319156, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5648853941, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0947238193, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.1115471187, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4315589035, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6190094476, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3065593461, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5311466716, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4918904748, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6551168488, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.145608516, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4152567008, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4895484391, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6562187219, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3382368481, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5521518994, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3028483518, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3991070934, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5925781167, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3958704329, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5196505496, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4850978822, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6352541214, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4377997022, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5678763862, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4377997022, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5678763862, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.15978969, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4908696279, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2986045492, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4455663313, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1905028824, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3175856028, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5117916535, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6878657355, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5379676902, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6655488114, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5420104448, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6785083782, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3603330051, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5012711439, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3603103614, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4864225703, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1717511667, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4084335314, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1975941307, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2752059719, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2983588345, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5041326433, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5354397296, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6627191682, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4961226772, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6218353723, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3857808913, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5169273955, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3857808913, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5169273955, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4254337673, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.581887391, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3495970095, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5356888229, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.381830829, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5561897012, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6743633529, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7903753469, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6000288092, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7429500653, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5781534325, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7443062675, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5809669143, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7168714328, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.524831709, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6414304239, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3976353644, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.60373356, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2102569642, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3908019352, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4392975118, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5889147221, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1148153812, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.2054979156, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.350184784, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5180344375, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4105639022, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5404388903, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4339080814, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5601377135, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2119537141, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4061072765, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2209496766, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4276390348, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1028912425, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.2070803789, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3554804781, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5288950977, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6348377556, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6773728017, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3483718729, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4980927055, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3248895898, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5442618575, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.335717151, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5153790879, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.252811687, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4299452816, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1178130184, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.2021918626, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3511112514, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4736008842, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4440478276, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5596520713, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4161837774, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5456804815, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2248526056, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3876111278, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2248526056, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3876111278, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2336021028, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3931394603, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2073747906, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3654501419, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0578479682, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0923979408, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2977932227, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4543890393, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.467732238, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4647428083, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2225673428, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3765773373, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4575089222, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5374740663, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3836655982, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5374740663, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3114281969, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.45383015, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0578083904, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.09190081, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1704823945, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3342299669, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4017730387, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.574816216, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2719326877, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4943569701, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2026214534, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3813079901, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1911176502, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3548997321, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0977573237, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2027374712, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2302608192, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4630122713, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.130651133, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2170867394, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.457068278, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6043967968, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3806307491, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.558044293, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4641849274, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.606128856, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1886552453, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4391044715, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3187378316, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4900083865, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2431364796, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4460325653, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1136798693, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2241654517, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.27865261, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.422788034, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1696179559, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3473249667, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1513162576, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3665181321, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2173763988, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2499606038, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2173763988, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2499606038, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1073120515, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1863606235, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0947457826, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1734003948, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0297809532, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1716685265, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.456269453, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1211033492, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3845930522, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1751636962, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4465249673, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.162139429, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4239095999, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1247117524, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3393879612, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1191364873, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3300153785, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0885638721, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1467534744, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1859941931, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3092478317, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.7409995287, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.9017022389, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.7096224668, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8862932371, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.882190725, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.9431233924, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3979309387, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6648788692, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.7147882714, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8408773556, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3359230828, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.57308612, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.7106361352, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8390104108, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.777055454, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.9260678177, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.8767740197, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.9055624233, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.8627586294, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8964369717, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.9082489096, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.9677853955, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4178102249, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5541365812, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5425651337, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.657385166, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4378498065, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5570867906, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5166819833, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6450630416, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4504787314, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5879031109, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4231763152, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5646316458, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3242957438, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.442383555, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5808022164, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6627998165, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5847143752, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6677870097, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5267859046, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.66640551, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5090592077, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6898128904, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5494728225, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6505680719, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3698191282, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5379681558, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.192945074, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2034303285, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5464960727, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6338335575, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1191857202, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4234617627, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1846760813, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4612761981, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0749880436, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.322429547, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0747095515, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3255729229, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1164634565, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.414592372, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.1879992779, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.1897174996, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2030347987, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4994712399, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2562052802, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4919666752, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1638236366, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4680776468, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1018416907, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.411121601, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1270469748, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4390040485, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.27749478, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0980207484, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2574156136, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3915391819, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1565461944, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3361013163, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1379310072, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3240963506, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1450274049, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1450274049, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1064532132, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.101636806, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1209627796, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.0999177768, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1480417518, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3781211342, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2098353971, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.428066526, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2034128892, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4150437746, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1964445362, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4060267989, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1666608456, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3746696825, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2635248148, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4250802969, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1191667008, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1688552309, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0733604961, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.292435357, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3004299909, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4693080732, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3925406773, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5373872823, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2837965378, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4275818989, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2873543606, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4564363265, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2964997392, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4458620902, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2712458796, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4127186604, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2738616869, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4556817349, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4053606506, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.55788953, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3563341748, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5388531567, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4378847364, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5875237951, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.349595139, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4727844502, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3448260128, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4979112232, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1635068195, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4252045956, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1936794368, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2703053606, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2723565577, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4477697252, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2029302654, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1150211961, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2826072681, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1944112173, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1898118992, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1890523863, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2094352327, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0925284622, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3628617912, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4006532486, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1584528066, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2274011212, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3029246309, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4012206533, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2083217829, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2168179115, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1525635461, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1180809808, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1883725578, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2623758746, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.357462207, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2600563389, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3234798829, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.222892194, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3382837811, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1919457048, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3171637914, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3391071441, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4066486585, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.279103657, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3447941294, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2897781371, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3668617746, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3459946201, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4287694937, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4817073354, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5422050631, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2922288165, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.367499064, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2159291981, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3174152476, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2228217149, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3388318294, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1112346978, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1506769208, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0356143901, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4452444344, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5114675835, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3360386791, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5211853612, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.216755068, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4463601824, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1456802428, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4239962379, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1456802428, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4239962379, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1743271271, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4068910883, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1453624703, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3719956686, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1346282624, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4060253336, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.215541824, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4433895652, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3996351663, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5955868995, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2138276008, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4314761329, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.304787443, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4853634498, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2975561329, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5046099634, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.225593647, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.439659789, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0638707075, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.2924377768, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2454457226, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4543069356, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2698452317, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4582070027, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3011454888, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4262131523, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2324022445, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4133384318, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2370996127, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4151768755, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2286020569, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3182044233, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2621312439, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3668283434, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2822052108, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4198020226, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.327270155, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4507432073, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2866246702, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4336774105, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3211041147, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4480786241, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2791328216, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4260697289, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3232950817, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4734532656, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2415462491, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3827297945, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1874127687, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.2766384575, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2593593634, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.432716743, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1632548713, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3165500484, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2226908477, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4278034123, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1745413053, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4080884742, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1696644941, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4003039896, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1452031827, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.0296116252, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1445040072, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3304287005, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5073607254, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0943246419, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.348055533, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2351948771, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.38703231, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2051918387, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4546635461, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2134578088, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3859086756, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2371342683, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.0366033491, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2175733313, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4453992356, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2006128367, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3495758281, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0799827393, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2553179648, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1476468805, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3128469009, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1450081672, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3173242925, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0440526439, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.155576245, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0407455503, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.1496552105, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.1484241683, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1167687752, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3390310486, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1479505099, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3451106706, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.153698956, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4476290114, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1912081758, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4096925023, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1708351702, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3915073554, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0647149802, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2882933468, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0646129461, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.1528345554, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2631405488, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2096209585, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3677788424, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3273734954, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4740682101, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2841613006, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4218648611, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2807428199, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4058440896, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1668073758, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2663384155, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0788254359, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0963282471, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2425912272, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3488665575, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4322305878, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5066667713, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3787768943, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4634054471, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4740262814, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5891073642, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3797264331, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.511342492, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.397061081, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5301051151, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0756968045, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0811511315, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0960638002, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3751172096, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4914945427, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1437669048, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3557201485, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2010029286, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4076276305, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1107840269, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3052404531, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1146310497, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.290986151, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0939075792, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2124815759, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.1569787206, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1669091071, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3273742854, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.4135342006, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5332641004, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2132210003, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4136653534, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1637342874, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3881970983, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1050275399, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3683025402, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1174266534, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.365633453, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2461057262, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0526762561, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.1535018229, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.135534048, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3371278821, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0904900874, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3899650893, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1548512533, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.316352438, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1571006265, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.181294398, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.153822641, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1340819876, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0783962175, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1846437553, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2622163182, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4929088971, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2243179352, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.396042274, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.091600603, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2288450359, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0824179698, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3466608728, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1213408296, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2682674586, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2373706275, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1348260373, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2697371983, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1648883063, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1076363912, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2286324938, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2156248011, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2122236503, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0311567798, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1664642062, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1462616347, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0023775559, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1563179699, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4199470043, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.116470837, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3623662722, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0772736318, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.369854723, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.144245043, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3278751519, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2677155318, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3794964997, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0651036529, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1687003584, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0713277411, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0627129314, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2665116614, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3890491199, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5272334689, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3366798594, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5032290576, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2455276401, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4595968294, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.293799467, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4721695545, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2851452081, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4757962295, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2557023064, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4734137274, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3130976818, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4792341787, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3707982382, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5308246783, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2618412981, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4539571997, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3695120663, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.540195675, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2665610582, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4687918044, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2665610582, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4687918044, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1479420557, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3647509559, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1017422636, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2235019521, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2648080421, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.467419629, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1666398737, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5129077754, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2961436724, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6045301048, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1347107589, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.284323294, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1347107589, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.284323294, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1432084252, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2864172629, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1051524572, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2183311032, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1381756742, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.261952816, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.444969586, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6926365319, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.4113509023, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6201370796, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.4108322478, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6633295107, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.4113791262, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6958747658, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3628537127, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6272308931, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0928538035, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3336498305, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1057078597, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2119804511, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1136832002, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3573231052, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1465869851, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3019087046, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3199269653, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4634857364, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1706615063, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1706615063, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.122554084, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1211046862, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1121601173, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1570619085, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2065671631, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3866003891, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2960694463, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4881747008, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2496610332, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1657794582, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2349230687, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4194990056, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0349473082, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0883484497, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1986615589, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0872815278, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.335710002, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2468849867, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6300112897, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8107492451, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9000327478, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4294674116, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4294674116, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9484564543, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.92894163, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4168218947, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7823629306, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9484564543, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8761560783, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9484564543, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7406375009, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.916098851, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8107492451, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9000327478, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1619557013, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5142740246, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3132252321, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3502541231, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6825372618, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0912294176, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1372586106, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1114738485, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0519478915, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0519478915, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1350501876, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1114738485, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1350501876, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1114738485, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0682114861, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0793331743, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1350501876, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1114738485, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0940802474, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0989535892, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0783995141, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.062613895, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.115381841, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0920426804, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7608566263, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.881580297, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8395876231, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9096086669, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.5054091116, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5779798191, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.5054091116, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5779798191, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.5821747318, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7539119883, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6885326215, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8229812189, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7608566263, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.881580297, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.5824621546, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6375144449, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6885326215, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8229812189, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6885326215, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8328652216, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8395876231, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9096086669, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8395876231, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9096086669, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7178970818, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8295858853, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2516966959, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5710821659, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7498810286, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7886148242, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2652951833, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5966999603, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4122954704, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.705800771, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2592170537, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4896263152, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2592170537, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4896263152, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2104783779, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6117499552, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2104783779, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6074381661, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2371332025, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6388309463, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4747354911, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.73602868, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1985082374, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5458763572, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4122954704, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.705800771, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.589811312, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5838763482, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1895162957, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5476491103, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3107293146, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4306285423, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1435622312, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.457146715, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1417229241, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4762857001, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3022474973, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3022474973, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4800955244, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5401265647, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3512368105, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1848293624, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5172215727, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1786870215, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4652953619, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1623467672, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4813797008, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1685379097, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5242065098, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1581263595, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4522083091, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.14384024, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.465162974, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0781023539, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1040157761, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3225233643, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3124325728, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4415757259, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2185059453, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4049269026, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3327803453, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3327803453, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2123347059, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.363001639, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2721438001, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4244951818, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2185059453, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4173980391, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1958598295, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3998957846, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2232587706, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3876087373, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2741229265, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.372165735, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2741229265, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.372165735, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.155731889, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3440012233, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1617059616, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3380502395, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2339819753, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1935951734, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4366770287, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.2466674258, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1591242577, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3684978836, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1338016138, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3620746906, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5677534942, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6843296717, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6239771259, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7203812768, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2373131971, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4750592895, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8787419089, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9422733087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3463101483, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5237307225, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6666935927, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.788605988, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3854501214, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5957790238, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3101157575, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5868493159, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1994044599, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4140097711, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.1999934463, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3052045715, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3734832063, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4454332372, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4678134834, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5051480557, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2952824242, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3327828516, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1985082374, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3322089543, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4028998029, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4342233882, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3734832063, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4454332372, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3333887486, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4116646458, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5894159589, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6334377633, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4742664049, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5335499797, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4636073106, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5726015902, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3734832063, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4377193699, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3906219304, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4740791147, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3357306484, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4290137254, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.204140515, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2728627799, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3659203478, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2669741196, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6328956554, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2734118505, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.641165185, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2012189247, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5567939083, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1922854475, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5417764306, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4041187387, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6888233111, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.9086549611, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.9538780145, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4762901942, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7299685604, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.670001214, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8763862761, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2089185389, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5547930109, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5645815242, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8151453923, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5972046851, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5972046851, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1587437613, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5342000553, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.2457040883, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1747094296, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5699365673, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4388504279, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.8080705633, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4841156774, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.8256726071, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8363600587, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9912737183, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8895260356, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9215559913, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.6018154976, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.7669980679, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8482942955, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9256238041, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2117127348, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3468080195, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2748321185, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2095142894, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2989889871, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2095142894, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2989889871, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3332411633, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4039853785, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2218501907, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3365436883, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1173220105, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2529983602, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4081354057, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4795517466, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.6068206304, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7266797932, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3920224697, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4805950433, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4081354057, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4731088237, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3332411633, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3993319311, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3627171579, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4226591811, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2064217991, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.191785002, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3514233824, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0993195473, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4660581947, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2503460073, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3123576616, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3123576616, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1402577516, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3730666925, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2780527232, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4881594142, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2126774619, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.8663975518, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.9369949537, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5278627722, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.815437935, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4168218947, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7155178722, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3742031646, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6713980678, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.616916927, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2823945344, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0952064686, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4231985179, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3725133799, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5810872573, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1949624908, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3404780052, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3216265867, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3631346017, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6488446911, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2901896324, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.542847577, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2622067644, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4004199534, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3308478035, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5879159713, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3222538602, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.596995731, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.7708186875, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8284786787, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0860352072, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4178507188, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3779384373, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6768016165, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3077932519, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.1756588074, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4715757341, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1833170495, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.468167493, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1481394579, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4346232049, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4793144467, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5290208229, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2610490903, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.595606837, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.446338868, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6877687248, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3296143242, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4546852632, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.765409184, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2021780304, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4743589083, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.9226314544, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1481394579, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4278722852, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4952330116, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6324855803, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1243672209, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4638123954, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1000835074, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3399171525, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3267507236, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2180019396, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2974641182, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2082883818, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3002418281, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1494292792, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1494292792, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2234473632, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3517185856, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2234473632, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3517185856, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0738924501, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2530618806, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3181932376, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3060737551, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2053633774, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2362100396, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1700448692, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2082883818, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2985584273, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.242505662, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3842334003, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1410292911, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1670235608, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.321843152, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4626955907, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5813300951, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4962806188, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.614275434, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4751132439, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5331125669, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4751132439, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5331125669, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.6813997516, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.78395749, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.7964269517, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.8589615671, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1365189729, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3779992936, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.8395876231, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.9201441894, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.5338072106, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6564887792, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2434330428, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4684960451, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0030750308, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4526353562, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5592911782, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4901445174, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6491845646, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0135429667, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.5784879107, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.568310442, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3033668866, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4694590303, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4499781507, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.525580448, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2066418182, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3233016465, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2066418182, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3233016465, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3121192034, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4859322738, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4290255654, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5591695776, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4028998029, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4615263916, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.5275959726, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5562472188, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.5275959726, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5562472188, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4884391792, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4656933855, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.5255781734, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5338694785, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.5680635025, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6428616303, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.258230776, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4462632944, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2352761276, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4742664049, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4991169087, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2131456897, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4218207205, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2874301159, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.209648485, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2358742866, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3087246122, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3254777991, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4305243634, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3239539357, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.280395012, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4428879051, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2195152443, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4204505859, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3807134866, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5378980705, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1966781229, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4001212148, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1966781229, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3952782445, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.331564978, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2470906323, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.360763266, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.18038303, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3896135507, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1779392575, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2801288821, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0958506163, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.189320267, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1992392873, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4663425113, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.324077955, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4812338547, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2338469458, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5096772803, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6511024508, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3898369139, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5816984404, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.458735768, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6043854821, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3485638068, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5963375644, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1670445271, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3361164828, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.184589582, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.412776958, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1408591642, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3380482597, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3341317422, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5079573405, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3861304706, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5248223978, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2974309562, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3992519602, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2745762486, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5002984561, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1581578341, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2976997537, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.416179145, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5532809971, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0086913203, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.0560457455, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.5131341854, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6909093149, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6036101601, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.4588667801, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6644271635, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2315288896, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4544566268, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2819047151, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4860988074, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.4774025962, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6645173033, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2332467588, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3222841628, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3029955224, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1059399151, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1076318077, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.0975916076, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1196835473, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1296705297, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.0026709402, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.29277966, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2352229157, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2646447028, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3535161075, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1778589789, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1191061089, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1576487987, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1259689163, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2476165058, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.486714651, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2476165058, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5008770061, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4516694906, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4516694906, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1646702986, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4015922868, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1577454598, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.540468595, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3291681797, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7541859578, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.8925780651, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.6028817682, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.8184572216, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3541296817, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6270889448, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2535705448, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4484416535, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5718331963, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4825577531, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1584450134, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4556529075, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0668660749, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0821446512, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0434223223, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0434223223, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0592105263, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0655505944, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0425352903, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0846491228, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0911327443, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0668660749, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0902352719, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0821446512, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0764798324, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0069444444, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0682355626, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2021780304, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1440757646, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2068791305, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2282895423, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0412755409, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0412755409, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.340021562, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3371988034, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2610490903, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2722033387, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2116210665, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2393259522, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3110126616, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1792334464, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2344967623, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2227227312, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2677055448, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2123347059, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2655126466, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1922854475, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1405962417, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0678700275, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1402577516, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2329160566, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.313100708, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5511747373, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1420515519, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4410628158, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.269677842, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.269677842, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3648139825, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1420515519, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4410628158, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3277723031, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2154499273, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4386201136, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1746000523, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.400676476, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1523461046, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4672690828, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2281739544, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.533351248, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2269006874, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5346629648, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2696565255, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5248534525, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.2181331172, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.425183321, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3617640392, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5522465855, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.2418733936, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.2575658061, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.2575658061, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3163161243, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2368768539, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4980341077, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3368689095, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2569984871, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.521874364, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.250450345, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5561372886, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4004366632, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6786513775, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1847170673, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4757529329, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1846205354, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4770609531, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3104807892, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.2922953335, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4235355276, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1896632646, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4171144217, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3276463795, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5691582878, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1797645143, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3585067888, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1797645143, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.343282119, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.145821488, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.310826964, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5327899254, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2750129589, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.6880908437, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.8057610215, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.5446619336, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.7009531476, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3114222098, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4451027034, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.4331536929, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.6392185687, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.4331536929, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.6392185687, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1872867463, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3939325011, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1878901082, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2690293753, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4926185189, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.35880981, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5299274111, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3401185072, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4698914884, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3595597536, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4807768458, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3595597536, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4807768458, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3707191241, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.521509471, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3530655324, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5388344492, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4023221174, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5438807583, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3395665609, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4640706251, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3317190809, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4513622173, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3401185072, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4698914884, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3395665609, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.486902294, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2560951677, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4490809853, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2242250471, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2278371391, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3867932684, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2006312662, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2115210387, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3736035604, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1259725704, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1870083099, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2227147729, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1045990548, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1880220063, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1881368725, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3863148949, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1561312219, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4269463655, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2657895901, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1777383986, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1614992736, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1522111816, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3040820656, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.4081124129, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.6001792982, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.4354676265, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.66175729, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2662204449, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.334569238, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2665965212, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3823133137, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5105137894, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.559110419, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5502408885, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5654268255, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.194457249, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2659249674, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.7092625431, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.8127893086, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.7254204378, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.8078563607, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.6823528627, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.734021738, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5608429424, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.7377212542, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5184760553, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5428419285, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2033344819, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4584540305, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1243018504, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2432739373, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5577288804, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.6039990179, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.491736538, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.561226022, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4799236604, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5677112073, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2837655733, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3548188786, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2837655733, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3510899956, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.575116764, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6677474341, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5303402316, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5507521835, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3433574272, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4383902107, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3881559367, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5906846754, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5792154834, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6702416408, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5486578344, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6828178383, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0506020721, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2602202273, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5366441956, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5916693427, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4756289336, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4877017848, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0230224296, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4755160782, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5834441686, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2435604214, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3927355784, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3267294026, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4333271066, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1940607133, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3533983916, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2220510845, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3592356435, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2721315717, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3876323908, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2293643619, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3476847059, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0032051282, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.5502408885, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5526384139, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3863093619, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4399981142, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3479992308, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4316731144, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2117146063, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3679105846, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2117146063, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3679105846, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3401950627, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4187587391, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1983704639, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2458215335, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.335417686, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3669951215, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4183719657, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2284240389, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2546939136, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2546939136, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1590542799, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.427734116, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1466968641, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4749329376, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2702173841, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.228783865, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6264262129, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1472821272, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4883679712, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1885651765, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5377638658, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4336051762, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1967421487, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5589633489, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3234249855, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5669007627, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.1476770699, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1475758119, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.516137029, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4281598089, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1881846806, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3593727228, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1733970492, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1992260278, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1502529053, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1866149123, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2422432795, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1742174981, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3878561122, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5025112454, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2706380286, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4725085408, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1939469894, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3735791805, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2291421308, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5494313752, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1260770492, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2724465904, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1267371854, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2342177526, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1972968047, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1971221255, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.126131227, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3636196383, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3444628324, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.204212837, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3883201121, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1997880199, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3566648944, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1418976346, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1396681036, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.167709495, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.6695580814, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.6418894961, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.5249562834, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5698312266, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3090705808, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4278716169, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2298686471, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3934151437, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1330986798, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.120132695, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2234766909, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6417603075, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3770929789, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6881502501, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8003203204, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453478043, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.6219720159, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6387580397, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.7215691881, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.7351007898, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.6517181973, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6481167034, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.6517181973, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6481167034, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.7004877183, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.7205373993, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.6219720159, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6387580397, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1014359122, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.6118437608, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6194911485, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5796016058, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5650600724, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5894567062, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6051783687, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5907010931, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.599558184, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.7215691881, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.7351007898, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2860852305, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3712901521, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.335005994, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3437111739, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.630923554, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6458808155, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3175465093, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2028736642, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4345894779, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2614502001, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2614502001, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4033902613, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1143480002, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3575409422, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3331873213, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1359834555, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4135396704, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4007426084, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.310115928, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3909330179, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1296247288, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4770091941, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4077182885, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2172954097, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1217311552, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.390454451, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2293530952, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4689601315, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2855261947, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.519791464, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5508290064, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5508290064, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5508290064, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3545968453, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5519360559, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3545968453, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5499993547, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.270623955, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4407436717, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3711335186, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5595427509, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2327428511, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4091360044, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2318983523, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4415779783, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2324422363, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3902749945, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2324422363, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3902749945, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1191775699, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3785009332, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1290151804, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4291066974, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2185876061, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2325135538, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4298699159, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2318983523, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4308975097, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3330732444, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2372131719, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4319465814, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2318983523, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4056332464, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2403479326, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4050255206, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2941711396, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4653698221, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2308824748, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4282830335, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1551155009, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3922184662, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3143012009, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5013155459, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2471508732, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3982414931, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2471508732, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3982414931, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.164519294, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2957279303, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3392650036, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5185478415, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.179231693, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1079358383, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3079497312, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3049259527, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5152417158, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1140128225, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3117911565, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3401950627, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4870855839, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3285767571, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4464566565, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1726095572, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3318416645, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.167613689, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3891469266, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3216398971, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4414323713, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3722001929, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5252698639, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5369357392, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5925671678, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5369357392, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5925671678, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3514475288, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5361569876, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3065373522, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.470197887, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5021151726, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5841884403, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2091383814, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4096009403, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5369357392, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5869601651, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2791475974, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3958350232, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2097473307, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4145586808, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2091383814, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4096009403, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4572970761, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5446642967, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1608653162, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.2797876941, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3277803742, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4267708983, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2287219601, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4508985758, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1258907883, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3414364807, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.33124278, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3489311424, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1198680995, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3462946766, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1697800812, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3589878684, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.168504816, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1755035418, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3977547522, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1891005485, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4671115766, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3266618117, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5670457943, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2917592978, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4529901075, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1591961279, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4455676021, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.30531852, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2446391069, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2908660541, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1383690338, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5516548411, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2829559628, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6067794554, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1359779634, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4484665724, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1359779634, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4484665724, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2086328321, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5109257435, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1415394535, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4466955096, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1478596781, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4646009041, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3458989585, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6136307265, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.233210787, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4758513477, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2810551684, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6477048454, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4732656865, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7021422986, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4732656865, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7021422986, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1307201098, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4862878243, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1181001951, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.3708545153, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.342337572, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5343801173, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1155665376, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3140069932, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1175771443, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3103572691, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3024842516, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3090152221, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1262927997, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2933944065, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0808989823, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2571823671, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1956356196, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1055629359, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3048267146, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1250851987, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3057389265, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1236325137, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2692822155, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2447065115, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0853507803, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.29810487, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2776405456, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0941061242, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1369603584, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3335388003, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6871514991, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5322520826, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7271316675, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6871514991, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6871514991, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5523722682, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7471196628, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4961133462, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7296403082, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5276151436, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6871514991, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5274964121, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6941952619, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3763278728, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4745362241, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5523722682, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7219229058, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5002744991, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6429454825, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5523722682, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7471196628, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3213275672, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4096177772, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5773184063, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5331034421, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6806929098, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3270534172, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6313546086, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.6144246566, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7550732449, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4958271735, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7377780893, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4958271735, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7377780893, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2238855011, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5288881529, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0629502807, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3271734324, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5831654195, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7601444481, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4679728964, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6053337914, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4730161463, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6981990328, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5023049672, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.688514039, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5023049672, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.688514039, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3363819044, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3649580098, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4568628393, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7163619638, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2680165156, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5590529073, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5470973835, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3602381155, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6357024906, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3602381155, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6357024906, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5563318425, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4523874747, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4653697322, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3200938205, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6393945963, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3803773679, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6906084512, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5478041898, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1888243784, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5789754713, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3200938205, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6393945963, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4701351186, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4342716445, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5260796354, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3047091549, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5428758122, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2893311641, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5798018459, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2614402196, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5270061175, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2614402196, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5270061175, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2994985312, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.61170222, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2994985312, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.61170222, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4376035091, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3127937309, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4874766694, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4184199372, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6644204177, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4259108629, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5685406244, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.316227766, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5331131422, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.316227766, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5331131422, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2659635195, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5819860704, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1903786196, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5872021106, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2893311641, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5970102525, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.184589582, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3357871698, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.200389085, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3836585468, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4868202184, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.536395072, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4868202184, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.536395072, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1507167626, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2891630903, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.200389085, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3363470724, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1081734092, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.6681082569, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.725747847, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2010537345, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3461597308, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1860533529, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3760221461, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.5998949117, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6761932469, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4859373819, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5468690247, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2051569194, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.5398995685, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5601040209, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4275341525, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4126375622, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.389264619, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3964051687, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.144821893, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.366852953, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1670329771, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.478327038, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2739399901, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4227538624, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4232731925, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2960731972, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1452362661, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4729236733, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1759326237, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6193592475, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3889473075, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1915653719, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3447932071, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1751062735, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4414706046, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3742996442, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3150504545, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3361093415, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3680683341, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3574029228, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.383541535, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1440453111, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4724943997, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3077874158, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.448041448, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2744668545, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3540230246, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2167710345, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4369788277, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2608721373, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4425523568, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3771475821, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2908987134, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3111260879, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3896462403, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2919152113, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2919152113, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3074764316, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2322024582, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.1558741392, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2263779158, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4614091659, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1974060384, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4392402072, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2876656267, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3597494652, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3564249821, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3526827693, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0139373362, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4256815036, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3453786558, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6888865426, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4994359587, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3578835436, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5503287051, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3578835436, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5503287051, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.261201334, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2502511779, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1110460197, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3725748409, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5408894513, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3559739463, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5408630325, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2910873659, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6726279357, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3259889346, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5117673951, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2167545321, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5731679833, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1423071533, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3546151079, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1531682455, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3155588395, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5004428569, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3191922067, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.46967595, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3191922067, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4322938743, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2881185954, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2881185954, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.284160485, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4011088672, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3936919393, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5367684136, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3047091549, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4567989668, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3792611112, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5498654958, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3015899198, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5407786458, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3132259425, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5703202725, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1189477267, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3633504363, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3163032924, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4566752559, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3387725036, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.0039872408, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2837655733, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4099902894, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1387736505, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.400180049, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3312615529, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5044209916, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3705911955, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5193244779, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.0963782232, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1823990545, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.425309437, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3424536496, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4759175046, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1998881565, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4045022212, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.5770362357, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6448162735, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.5596234868, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6146584646, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1983977401, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4228960291, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4036833691, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2521409599, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.459685864, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3383930155, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2514130629, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2961516536, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.498582506, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2878333694, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5587364816, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3642301319, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6103580099, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2447987985, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4989995992, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2447987985, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4989995992, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3642301319, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6103580099, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2199382612, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5016488706, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2651383006, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4460975519, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4419435975, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1470815798, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4857421015, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4894541275, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2376956048, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5396996022, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2992831986, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.276654641, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1203080339, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4034365089, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3308548467, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4135995626, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2204887282, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2900060977, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1496284837, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2335293, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.242949285, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2646015952, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3157063697, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2307712508, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2871523535, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2153820205, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1969801488, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3541296817, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4347460768, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2697856976, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3242134827, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1587572218, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2121588114, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0369267533, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0924167732, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3308548467, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4135995626, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1597972731, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3237722713, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3325894778, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4033582073, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4663100468, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.5549270001, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5679891636, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.210616616, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2530915651, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.229790895, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3353527175, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.229790895, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3353527175, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1409882908, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1818723447, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.457015118, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4827101977, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2344257726, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2858983662, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4223157403, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.517518937, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.6061105882, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.6319310382, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.465075508, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4753776302, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.157560095, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1917949409, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3174875225, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3324201738, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1756788504, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2932341322, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0990075369, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.81647957, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.8378701011, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2634592129, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5830409447, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3032929625, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6298789413, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2638064752, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5568746681, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2638064752, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5568746681, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2634592129, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5830409447, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.467013158, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7437638564, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2505523539, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.586369645, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3032929625, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5928831842, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4908301093, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.8148280158, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5298537181, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.822748932, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3074203461, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6805350757, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.412475066, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7230635818, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4300000761, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6769226621, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.2603279434, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1509425812, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4957807155, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3409360571, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2382939784, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5141279223, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2168880192, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5164502019, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2168880192, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5164502019, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3913943517, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4335409233, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2206023613, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4722706296, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5039471119, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4962271754, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2105946974, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5326130101, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4450357968, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4828640829, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2853837111, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5109111081, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4175420834, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4911355432, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1633647013, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4295267613, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1190200191, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.370068692, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2066736214, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4333016516, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2066736214, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4333016516, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2322019808, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3138982087, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1884575364, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2797941129, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2567840481, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4780963115, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2507378339, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4157511848, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3073899154, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2404817939, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4185563869, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2404817939, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3887778043, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2017861586, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2894670684, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1260716212, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4021408353, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1691896235, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4942911926, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1312901848, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3768713475, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1320400322, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.370691868, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1347176685, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3119115134, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2091051621, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5402831898, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.166451727, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4173599375, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.4545984911, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6246203671, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.200409452, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5452353998, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3244913215, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5736635347, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1333675348, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4153642805, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.159490805, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4475133264, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4451296305, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.1150380469, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1323229159, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4925850413, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1998106449, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3919499606, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2904137617, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4440271886, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2909755167, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3877276005, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2909755167, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3877276005, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3762332647, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4417327887, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.361202704, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4275489501, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3107474604, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.374539283, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.376523994, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4474954197, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.376523994, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4474954197, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3784541381, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4493430485, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1978989004, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3035656856, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2788279514, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3921594574, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1741601768, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3262568204, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1805995719, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2915951586, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3973226531, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4578339802, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.196092583, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4573617031, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2806155761, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5604571547, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2778391283, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3612052785, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2819962476, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3738706208, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2109499741, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.391394749, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2095755691, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3184778945, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3401642409, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5639990182, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2573056186, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4658428635, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2308701797, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4107166381, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3395866013, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5379135197, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1157917568, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.426003858, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1885540698, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4726960576, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.1075151207, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3802834642, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2633905722, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4436643088, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2722704374, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4630549376, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0831979423, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.321471912, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0151087256, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.10794551, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2845621581, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4526033317, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1727833085, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4344972437, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1116181547, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2516546237, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4903570071, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1572307859, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4181020983, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.121182928, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3757003782, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4044473372, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6027382653, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.306542338, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4638359231, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0861997107, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2734884081, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.225175046, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1855520929, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4175056582, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4700695381, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1325451215, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4538619158, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3051552202, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3051552202, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2487541869, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2668685259, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1130518279, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1692731897, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4389579379, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4177661286, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1221966748, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2978425655, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3581478583, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3897036061, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.203230076, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0354636522, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2623065461, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2470891386, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4688632266, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2560635442, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4780977367, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1070100623, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3553402192, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1070100623, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3553402192, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1763123087, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.409487163, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1763123087, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.409487163, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1643614815, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3973520284, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1065411344, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3734232993, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4126320391, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5775573113, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.420636567, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5802713366, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3119177701, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4735355879, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.181358579, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4187138915, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2875216154, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0844777374, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2971141035, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0803651749, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3508089296, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2303529812, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6014508178, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2704657013, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6186468607, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3043357146, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2309660688, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1816989222, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1097070444, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1155618472, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3962645069, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6785332348, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2275603078, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5355940888, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4088500715, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2031394366, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4983563771, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2196153014, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5749676939, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2638014881, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1097070444, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4472084731, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.286272925, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4498943788, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2002273124, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4215148871, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0112683186, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1035363157, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0095826229, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1021959772, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0983140277, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0191508627, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.117952324, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1884697863, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4536070914, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1500493128, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3450393291, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2985531163, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2910873659, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.416717715, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1586578315, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3481222132, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1424719516, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0219736974, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1297499898, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8492326636, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9063898435, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5360330313, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7676864591, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5309354663, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6756014233, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4529852872, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6941474239, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.945741609, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9892952933, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7912619864, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9129058872, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.945741609, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9892952933, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3138372014, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3589660908, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1725834133, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2676886315, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1725834133, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2676886315, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2562402499, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.346213232, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1302040624, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1949478708, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1575186828, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2201696287, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3061357456, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3616235652, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3061357456, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3616235652, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3061357456, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3616235652, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3061357456, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3616235652, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2980986168, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3657032295, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.18056557, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2929008842, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1277700534, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2084699145, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2598534196, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.346213232, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6153267327, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8254407085, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4135171, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7050151549, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6907573116, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9077913232, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6907573116, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9077913232, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.334579461, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7523344918, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6179396438, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.866516296, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.609920244, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4699739598, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8114935753, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.5602926889, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8525951198, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4699739598, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8114935753, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4547722461, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7936318117, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6179396438, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.866516296, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2227227312, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4637652511, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4433857597, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3453786558, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6736450219, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6976333496, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.8331572108, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6976333496, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.8331572108, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6976333496, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.8331572108, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6976333496, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.8331572108, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4024582794, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6664090182, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5478437342, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.775208669, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5721869364, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7849794665, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5440766841, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7530101165, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3623885503, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6357079238, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5440766841, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7530101165, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2244783658, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6359627082, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2245435939, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6008671717, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.653781376, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7617489761, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.396412218, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5845407346, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.653781376, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7617489761, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4987046236, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.647874639, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4987046236, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.647874639, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3065411776, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.507825049, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3065411776, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.507825049, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2280299254, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4447177675, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5069147001, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6481561033, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3078333887, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4987046236, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.647874639, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4987046236, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.647874639, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4549681529, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6164314607, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4987046236, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.647874639, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.45686927, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6147353969, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2081154202, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4040637852, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0623135743, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3501235877, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5816664251, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2622716439, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4238491589, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3521082926, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5239651687, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.248317576, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.422411579, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2550784982, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4139069374, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3873284108, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.355669645, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.504350739, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.283078907, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4900779363, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3069033694, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4638073591, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.236320096, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4543479994, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3858404261, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3554837744, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5150536107, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3554837744, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5150536107, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3141039699, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3509809687, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3856185982, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5815699185, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8158797977, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7216597075, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.864764916, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7637483416, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8894308321, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.809701385, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8896806149, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.809701385, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8896806149, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6161420984, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6945809713, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4933292241, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5118244302, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5805399561, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.481046426, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1576498058, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5717865334, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1576498058, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5717865334, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2151061847, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.413802455, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3489214645, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4328796143, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4308163115, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4953960513, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4472888097, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4742664049, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4602272933, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3489214645, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4519496201, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4953960513, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4472888097, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4953960513, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4472888097, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3917196589, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5550595585, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4825434542, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5617848264, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.557088675, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4996136935, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6351045116, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5064127216, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6516332048, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5064127216, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6608872773, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5064127216, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6608872773, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3531901509, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5822934956, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5273318485, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3532802306, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5839265502, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4988543287, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6436097366, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.34773856, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5870908285, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5064127216, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6516332048, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5212982931, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5212982931, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3732103775, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5997537786, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4647137781, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5064127216, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6516332048, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.351387494, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5704306601, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4592978566, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3299895473, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5059431864, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3299895473, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5059431864, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2945642545, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.569135833, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2945642545, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5597065389, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1711201882, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4553723133, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4655035539, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6467306329, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.173171112, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4960809753, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1508336427, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4714472446, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2537619201, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.471995155, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2679646242, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.541666384, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.357102986, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5866468421, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2634988971, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1251432874, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3496183606, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5187615227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5187615227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5199744507, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5199744507, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4397936464, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5197498882, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5199744507, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3981441759, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6510906999, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1965085477, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5134302168, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1965085477, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5134302168, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1739898488, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5216901259, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.189602679, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5147057623, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5199744507, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4899417818, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4916235565, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4477845944, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7043336945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5129586382, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7857394056, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4477845944, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7043336945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4477845944, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7043336945, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4822245596, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7511716304, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2078053264, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5406521594, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1928860044, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3923428792, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5106109398, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7688046995, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.6725157402, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.8704716257, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3494188592, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7072510224, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4544489098, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.8155088725, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2769348116, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6775019274, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3012697212, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6712254595, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3969347873, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4824766987, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7665355959, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6535194995, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8909391457, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6535194995, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8909391457, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6535194995, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8909391457, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6535194995, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8909391457, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6158161555, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8568982836, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4062749424, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.771757818, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.9390825256, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4373266725, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7265900332, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.681092017, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.7298378378, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8542310686, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5852187597, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7147018027, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6317498623, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8119634169, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6317498623, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8119634169, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5852187597, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7147018027, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3956955502, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6546777917, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5846059223, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.7483293841, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8146526693, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8151678596, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8873630456, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.7483293841, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8146526693, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.1139232219, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4512595976, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6268498244, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5852187597, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7147018027, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.398821617, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5852187597, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7147018027, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.154023164, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3618269859, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5606184355, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3071747168, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4836163769, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3071747168, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4836163769, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2765950321, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4432072464, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3619724421, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.30814988, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5450474312, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5450474312, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2024802785, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4353181305, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5450474312, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3562070893, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5293559991, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3262024391, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4654796792, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1741578467, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3586870164, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5606184355, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3733886407, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3821642644, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4146932034, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4146932034, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1447953616, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3672186527, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5017688443, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3398181363, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2559035608, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4786634069, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5017688443, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1821604173, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4452929994, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1576364753, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4448919225, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3598763208, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4724255276, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4444961493, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1591178311, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.439170067, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3162730677, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1446920532, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3906385227, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1415394535, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.378903203, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2991385301, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1892240569, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4132993503, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0166424835, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1601280792, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.36708967, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1627934873, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3909559745, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1523624986, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4850388212, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3264336473, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1405461328, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4001732894, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1731187888, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.378736994, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2369690015, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3151957247, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2597064971, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6796677377, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3348865558, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7293017619, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3079852791, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6441930748, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3791621113, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6955940763, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2284805641, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4641255317, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3271608625, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.396374772, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3719278006, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6892896282, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.437818694, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7710721801, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6289868867, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.818026119, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6289868867, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.818026119, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.407135992, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7697196337, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2111187176, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5500149009, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.252922256, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3639412531, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6558757084, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4572935209, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4768283302, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5067583406, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5067583406, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4572935209, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5424577954, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4883223607, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.453655627, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5067583406, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.401755206, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4095191931, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.453317979, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.453655627, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4039245319, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.44779059, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2115210387, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6675194677, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3268514139, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.7037076426, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.430125687, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.7706340594, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2930010354, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.7440537717, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2465903845, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6742202737, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2371332025, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6907833611, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2256490809, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5866569481, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2363339974, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6998524249, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1475954395, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6528001651, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4957546541, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2443461513, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2997691104, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.7186712721, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5852108991, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4437453763, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1150950994, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5614517727, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2085311124, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4435193095, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2175445226, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4621999155, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1425316777, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3600387581, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1425316777, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3600387581, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.206233703, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4218885358, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1598710593, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4326511029, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1507796145, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3926830609, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2175445226, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4621999155, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2240812633, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4635198585, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1941671706, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.400453861, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1535873584, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3955148125, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2085311124, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4435193095, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2287219601, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.503938018, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2256250446, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.314124942, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7973454775, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7689312469, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6532633715, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4867643692, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6460761902, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2814017327, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4963305768, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.7948343661, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7747058711, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.6941268298, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.7232925117, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2868823615, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3058846234, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2438857596, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2438857596, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2412383494, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3058846234, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1715463764, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1757108909, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.222625002, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1887792103, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2176061023, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2979981211, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.292037003, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4216533376, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4039571839, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4182495832, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4118425863, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1923018801, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2490706726, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.246450137, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2775164476, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2358729324, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.5951888719, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5197696051, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1850334785, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.6368556588, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5984210128, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.6368556588, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5984210128, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4269013796, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4438371473, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2171245797, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3121192034, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2979941092, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4983116255, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3705486617, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1988908086, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3279525548, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0699910525, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1576043697, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.4578730121, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4763409765, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3210886806, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3500722731, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3324024618, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3259497462, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5361018684, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3190887215, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4863428829, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5034231828, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7006437933, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5034231828, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7006437933, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3534548116, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6000869745, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3626305461, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5939784604, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3622755744, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5653237161, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5526778778, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7267402732, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3626305461, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5835071609, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.368528912, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.583972703, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0712014958, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3048128701, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5034231828, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7006437933, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2147607499, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5078156365, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3340392563, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5319774707, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3626305461, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6179355732, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5642137945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.8202028423, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.6298777848, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.878403256, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2999242985, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6283146443, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2999242985, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6283146443, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5214131583, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.758561428, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5464711341, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7864029397, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4702215641, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7153092714, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5582220192, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.8140951455, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5582220192, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.8140951455, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5649285679, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.8161130615, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5577288804, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.797404658, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5577288804, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.797404658, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5988044702, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7681690981, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3713830979, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.575116764, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.8407226006, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1040389688, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3115334232, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2852552909, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4078282862, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1962972276, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3201823353, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1962972276, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3201823353, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2782546339, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1260969365, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.268740791, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1645803633, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1956833643, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3723430987, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1472461905, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2839286654, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.274869025, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2283070458, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3919468076, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1670454255, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3413132323, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1338261308, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3051903485, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1469456765, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0854157565, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2185661833, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3948949529, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2320305803, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5875457251, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.367865978, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.367865978, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.395842947, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3593318823, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3064223068, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1656456532, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4536039872, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2476165058, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5724037748, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2945642545, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.6037213667, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3916729633, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1240959712, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.46250912, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3846659308, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4113262407, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1225914996, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4797495741, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2374993748, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5186241424, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2293648308, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4184099074, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1298267945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.359885149, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1298267945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.359885149, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2583858838, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4449030747, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1518454357, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3316482536, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1503474482, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3379957017, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.6007525447, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.7052132029, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4918887915, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6514476893, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4640531757, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.638469834, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1501665011, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.382731387, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.268229744, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5226016851, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1306462286, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2984123772, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.1968584727, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1291353308, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3699122403, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.255791467, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.492035644, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3759566299, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5278838809, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3764925638, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5986485546, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3764925638, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5986485546, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2460137258, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5651300594, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4252443016, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4389754418, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2141398901, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5141525253, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5162619435, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.7117190162, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3964543811, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1927369156, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5652312627, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2287868433, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5910527597, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3937601061, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.1116581774, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.4593840569, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.614452372, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.348179092, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.554627493, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.512948431, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6268186945, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3977135991, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1299191651, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4425861065, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3152093059, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5618098982, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3563054845, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6285749485, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1661865517, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4875519644, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2556795749, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4986688668, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2278350766, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4991401821, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2724128236, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4452104733, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.043407736, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2601621161, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4390960898, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6485099247, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1551155009, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4014314464, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2943579103, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1890425468, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4992010055, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1330844253, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4188741469, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2311466382, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4894179053, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1629944673, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3208008659, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2232587706, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4093357711, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1185666012, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2738204428, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0653487851, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2822867499, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0117896748, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1544875931, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4246935696, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4051787938, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3855365289, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0262916122, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2325340468, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2122363344, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4389052935, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3149190819, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0282062466, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3621071214, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3702730402, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.649647473, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3702730402, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.649647473, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3702730402, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.649647473, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5545363549, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2810335396, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5956686674, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3702730402, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.649647473, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.322821388, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5705123444, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4079273559, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2520126751, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4174826402, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3172479411, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3172479411, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2255009729, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2079988964, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1903468696, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2861555645, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4803502935, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2520126751, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4174826402, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4078425162, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2861555645, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4763638923, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2424854514, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4373335888, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4130305817, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2079988964, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4508926953, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3469824958, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2286960005, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4746698508, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0743900144, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1720101243, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1196268811, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1316613918, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1629057628, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3674817321, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5111850167, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.247019913, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4634617667, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.5696705282, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.6515641575, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3182485155, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.534549633, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2507378339, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4260818847, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2918937159, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0041113189, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2259609948, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.328872375, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3914273317, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3450219163, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3993348853, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4267049357, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4223884413, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4267049357, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4223884413, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.309780685, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2829527445, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2922290433, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2723003397, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2922290433, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2723003397, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3567464687, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3651755892, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2548454457, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2714025628, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3349838928, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3296536654, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2368693822, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3209099892, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3942831699, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.476356889, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3031148374, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2870689861, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3223833287, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3947515838, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4614654877, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4019452398, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2930072899, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4620516485, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2562150246, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4704647783, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3545085634, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5387990403, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3545085634, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5387990403, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2718284968, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5497265771, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1200188581, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4122127192, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0956774578, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2538064061, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4544505188, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6033006988, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3509258729, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5379703355, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3509258729, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5379703355, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3893626377, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5443518219, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2767438562, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4593243771, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3893626377, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5468468646, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.285557535, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.341644556, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4049402235, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5871644978, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7389181447, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7389181447, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4226108217, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6493613257, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4226108217, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6331414172, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4226108217, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6331414172, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4226108217, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6331414172, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6028670503, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7367363357, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5582486914, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6678493404, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4018202851, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6003256952, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.8406763479, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8871517154, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.8406763479, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8871517154, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.6666823117, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7571125339, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.697724039, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8189844672, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0101912475, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5406438522, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6520694801, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4018202851, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6003256952, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3864572432, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5849342936, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.697724039, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8189844672, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5793367581, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7675449146, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4847079074, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6505709784, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.7019499719, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8450280883, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.7397087418, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8865031415, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2042283847, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3821382671, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1820705281, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4504432022, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2091008288, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4538036435, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2091008288, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4538036435, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1429117357, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4518436099, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2205920203, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5084868417, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1008758834, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2599542518, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4909892942, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3099627272, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5091964648, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3441951473, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2128497675, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4385912276, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2383234074, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4365254352, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2066736214, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.445862695, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1617059616, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2774366226, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2108185107, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4042801758, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6425503167, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.807889193, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7181417753, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8029162546, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7181417753, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8029162546, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6425503167, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.807889193, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5970228994, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7623592429, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5970228994, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7623592429, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7629273293, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8510385545, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6425503167, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.807889193, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6888074583, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8055061208, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5970228994, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7623592429, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.697842929, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7717858931, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1818958799, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.439640804, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2147607499, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3976144917, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2745762486, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4360301196, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2745762486, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4360301196, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3941175366, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5506555497, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3606781489, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5071206995, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1896550847, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4310936955, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.649530856, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.7114963535, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4058951764, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6149515962, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3339087646, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5995623358, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4122974403, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.617091169, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3267294026, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5803377043, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3785572829, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2643854379, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4066689638, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5267604642, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.8253498773, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8529564805, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7944837206, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.878453174, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7072172848, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7914639887, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7072172848, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7914639887, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.7944837206, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.878453174, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1755381218, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4419744153, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2633201939, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5893220054, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2388752792, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.592499369, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5394044744, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.7201188408, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5394044744, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.7201188408, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2745762486, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5730023383, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2961516536, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5798430117, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1410157688, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3599849516, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.416179145, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6046852394, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2808924132, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5475272889, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3070898761, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5791648909, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3160022915, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5374439094, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2169036581, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5019141381, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0094944404, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.277333106, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4703077247, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.7203673717, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4369942407, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6009573115, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3009687072, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5341810386, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3009687072, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.533217285, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3009687072, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.533217285, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3140382294, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5631437829, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2281684904, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4984990869, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3140382294, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5631437829, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.7498810286, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7726337965, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.7498810286, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7726337965, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.7498810286, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7726337965, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4167743223, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4167743223, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.8318180062, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.8641903026, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4806216298, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6311658995, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.7186969684, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.8143071708, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1549509688, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4542126326, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5138104165, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5123350306, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7719555466, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5123350306, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7719555466, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4209973458, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4355615888, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3548263686, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2451829992, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5623282316, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3461335863, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6386405249, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4773779563, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.22119423, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5855963149, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2009685362, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.592296223, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1951419302, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.50962135, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2772639582, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6585810035, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3550420051, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5693079918, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1794560313, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5236301265, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1794560313, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5236301265, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1799107865, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5159811845, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4596307297, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1799107865, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5159811845, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.2423268307, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1794560313, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5236301265, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3550420051, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5693079918, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4596307297, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3550420051, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5693079918, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5052082359, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1799107865, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5159811845, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4492950043, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4608738249, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6325987025, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7966336958, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6325987025, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7966336958, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6325987025, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7966336958, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5694299147, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.716197428, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4601221425, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6704634783, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2904276736, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5945109732, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4983116255, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6906247423, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5694299147, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.716197428, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2624310277, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6025429011, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7887116805, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3905727762, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3934016322, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4393709545, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4618172168, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4713668887, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.487556786, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4713668887, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.487556786, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3246935344, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.411859573, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3754749997, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4281102173, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2951855723, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4165838257, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.7490853969, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.8062091543, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4405559459, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5608379078, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4462203715, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5604772872, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.7490853969, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.8062091543, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.7490853969, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.8062091543, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.5196976495, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5405459272, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.5054091116, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6683122486, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.7378351342, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.7822638455, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4240649322, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6515479761, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3460178708, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.477718258, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2200497519, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3580799709, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2200497519, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3580799709, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2331039707, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4183718944, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2713164273, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6108644122, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2028609724, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3641531894, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4772349067, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6979552346, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3214481224, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5957892992, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.404199615, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5081120457, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3371021562, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4921159236, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2206635049, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3982161812, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4220575162, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5679415458, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2411874286, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.7000942696, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.7771546906, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.6054657751, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.7275033089, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4110385147, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5051296805, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2989834109, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3436978703, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2989834109, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3436978703, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4290255654, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5598340094, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3910016226, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5825568684, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1691795448, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2486182031, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4535939334, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6211966673, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2487667554, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5735144785, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3042060838, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5646760672, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0590906756, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2991475814, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4458819273, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6326308722, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1937825697, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3758589988, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3626305461, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5172467981, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.4093632137, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7444177757, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3680806214, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.710671769, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2373131971, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5661601914, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2373131971, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5661601914, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2038395883, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1285486554, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2904130695, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1186565985, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2933615613, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6879419394, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.9251514069, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6248651455, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8644374396, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.4972358703, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7738363286, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6508430036, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8046848309, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6879419394, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.9251514069, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1193019148, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4570974492, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.1407230163, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4881069342, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6102624547, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7455382911, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6102624547, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7455382911, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4949431899, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6525478644, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4949431899, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6525478644, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3961867597, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5900232243, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2875699962, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5623490068, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4717991357, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6368175529, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6102624547, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7455382911, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6102624547, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7455382911, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6584518249, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7894751022, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5936781017, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7268454525, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5129914365, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.67190581, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3911295456, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.580008972, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4376250019, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6229933227, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3961867597, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5900232243, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1260716212, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4374864219, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.422195902, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4089778297, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4089778297, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2018577358, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4662742922, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2801260476, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4918406628, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5137576862, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2444764055, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.529751265, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2698809072, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5827120909, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1180263199, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4888836707, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2290810143, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5037331051, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2510015043, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5078973713, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3487239705, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.307711206, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1855551502, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5078671061, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1693985, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4808428624, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3557389634, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4337384407, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3830947998, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3830947998, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4438335184, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5658578761, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2612246289, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4622733885, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3648271772, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6036552406, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3040052735, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5563245065, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4758104038, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6192989319, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.4002507454, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5277651665, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3182356622, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5315680645, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3182356622, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5315680645, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2401497351, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4758492311, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2513491515, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4837504343, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3333887486, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3896967385, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4290255654, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6542302593, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.5438653755, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.730264991, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.5438653755, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.730264991, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.5438653755, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.730264991, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.483813463, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5124459841, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.1818824338, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.6612116052, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.7760591039, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.5438653755, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.730264991, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3060368951, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4831305032, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3217816921, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4853985554, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4260146736, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6715816584, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6168046788, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.515295825, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5435363281, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.287558382, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3019039432, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4790145581, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4292907667, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3226647471, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.332782094, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3221411249, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3304616882, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2514173514, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2894639942, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4546697237, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4460520025, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.2566290207, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.284458041, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3179303998, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3849979752, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1591178311, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1644514383, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1931328231, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.5426552584, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.5035808317, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3968302282, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3941633569, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4592806798, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4065020472, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.3702794921, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3917352141, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.4790145581, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.4956337511, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1423071533, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2479651047, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.171404917, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2274892285, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.5216690821, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.6663479473, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.5216690821, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.6663479473, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3461876786, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4375133562, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.267434228, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3325845097, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4518184436, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2527045558, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2975752324, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3292010361, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4311130505, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1823935085, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2213631609, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2347788343, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3032766574, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.5102002549, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.5481850559, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1714814357, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.267715555, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1832567181, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2734729855, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1709686261, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2258634618, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3902273664, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6827449888, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4303767738, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6909233597, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3902273664, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6827449888, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4884391792, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7061627662, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4093184131, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6844082267, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3309468095, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5082966624, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5194247347, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7440660672, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2910873659, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6461260377, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2426823579, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6128667394, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3324968566, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.637090237, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3324968566, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.637090237, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.430833096, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.666084073, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.5051836989, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.704730777, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1661641123, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.452625307, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3020584686, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6431625523, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3014785663, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6165177251, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2868578078, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5505861134, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2863070881, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5730343145, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2026478724, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5428362111, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.346575619, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3185890262, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1767958813, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5270697006, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1731670346, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3548551325, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2434623104, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4426541296, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.5245322415, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5814854114, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.5245322415, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5814854114, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3489214645, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4443581707, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.4265706803, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5676570549, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3496172236, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5137611857, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3654749252, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4608305787, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3131480144, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.305369417, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4636765045, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3269822513, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3282397523, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.275932417, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.444000519, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.305369417, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4724348642, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.241258805, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.453663999, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1447953616, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4245184965, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.3725748409, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5542570357, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1415394535, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4269729411, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1415394535, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4269729411, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2047265841, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4847881164, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1416796612, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4091413883, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1034486877, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2279301588, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2066418182, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5143883509, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.114343382, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3547078108, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2676032276, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5128827077, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1373727917, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4126418547, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.204212837, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4468235873, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2235444509, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4592148484, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.1808267864, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.2719559269, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.5350448626, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3459299125, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5677282057, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4277006994, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6058578812, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2252602156, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4823460203, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2252602156, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4823460203, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.6275541561, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.7316294989, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3954642332, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5607387096, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3442680114, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5316720524, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3943890899, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5760332857, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2228855265, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4870161291, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4070190836, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.594990406, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2904979371, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5660059777, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.353425281, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6247144454, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1925903911, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4507828539, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0994152781, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3375800401, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5942391704, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.7043046273, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2543786874, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4748216333, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2962225457, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5178269067, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3845687306, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3845687306, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2901334758, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5229103696, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1916664299, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4535240584, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.329783721, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2962225457, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4935676335, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3066439134, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4831982874, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2991528889, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5582453238, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2139991547, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4401240521, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1968170324, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4641799487, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.011704494, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2439145014, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4188399581, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5397858291, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5616963281, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2734404217, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1014524997, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2953987627, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3946720317, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4361039803, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5269731605, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1617059616, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5772772631, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1354715471, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4084064274, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1600872496, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3979154668, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1923018801, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5927843365, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1923018801, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5927843365, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.125778296, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3358649233, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3981211857, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3832762644, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5063945135, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4265686082, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2442205734, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4745686548, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2842110364, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4520674721, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3092676946, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0417186641, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1977428894, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0027777778, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1754386006, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4767496409, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3619317454, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5603087309, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1710145669, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3139687441, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1931333551, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.5370585235, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.193370065, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.6117839592, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.3216122772, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4889481342, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0399995338, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1429571794, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3964733871, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.8843865925, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.954691025, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.6396679416, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8130954822, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.7071067812, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8568176228, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.7071067812, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8568176228, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.6396679416, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8183519586, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4302123694, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6691232303, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.1736516518, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.7071067812, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8568176228, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4468947264, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6588405896, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.5741156866, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.7600101686, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1207417279, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3854432348, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.7500901713, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.8624598551, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3280740637, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.189755167, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.546736489, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.8843865925, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.954691025, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2760258065, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5170713394, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2591641361, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4862581532, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1824016291, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5287419988, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1824016291, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5287419988, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.273711132, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2698078272, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1950703465, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3491985989, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.6696429767, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3293405971, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5811461545, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2872797668, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4989885393, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.034132794, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.241255137, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2724974523, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4904389092, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3175607297, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2065880469, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.30376137, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5498110282, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3522386575, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1956943486, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5843699613, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0261640528, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0261640528, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1955775564, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0186862372, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0800897361, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3081206097, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4526756958, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2928298014, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5433026792, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.31214673, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0822277974, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3335295895, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3005283408, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.571668028, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0433173254, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0065308255, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2250920759, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3430416312, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6383283286, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4471101337, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7319347493, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0941071492, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.2236254279, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1406005899, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3205132146, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4275810015, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6481070648, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4424906783, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7213459154, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2847382405, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5944159484, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5702655878, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8232854346, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5627396124, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7683375756, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.464096196, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7474126325, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4280342552, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7260183443, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4361016862, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7150254604, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2318334465, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4876603712, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2396296698, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5138361143, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3597862823, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7212767938, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1775614884, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.213263691, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2478182819, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0740400946, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1352872342, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0899084549, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1652866737, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1239446094, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.26662621, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0911835227, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1259628326, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1073849785, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1843077021, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3053811566, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3388644465, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.172875056, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2485338203, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1489150477, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2618919111, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1406879778, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2422748846, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1439954854, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2528996799, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1487692721, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2536059289, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0411421284, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1070604518, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2641132774, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2898946819, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.116907413, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4498470572, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2577716972, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5171901208, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1642415557, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1781207588, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0463173253, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2155848022, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.0062003968, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0935060462, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.343062921, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2563978475, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5733913952, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.251684973, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5441146119, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2328789695, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5168980964, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2464358581, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5459613463, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2696398422, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5506563869, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.0045787546, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.0045977011, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2332550586, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5039484226, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2447969757, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5213023099, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3274016884, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5570399656, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1111409629, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.272397339, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1196425814, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3031655364, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2211880505, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4573855767, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1690653646, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4758186156, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2708105005, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4950813391, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4514968876, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6166500597, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3887923655, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6140755433, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3994778575, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5617218896, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3191349967, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5329750657, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2931154738, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5385310894, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1689139512, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4316682635, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0917566365, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3249994057, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.16249656, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.463754244, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2529076741, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5430833248, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2073141914, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4360555837, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2897852142, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2603665007, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.08070632, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3591167821, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2528857441, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5715569143, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2953701029, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4221671352, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6302060108, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4545481795, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6054218377, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4398690431, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6046405926, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2496855702, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5511430757, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2864021858, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5777536674, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0783361496, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2978243697, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0360938345, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1939545119, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4832003622, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2826168898, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5075237417, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3235473266, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5441122251, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.045954679, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.259858652, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1678735694, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2476163865, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2781578587, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3796663901, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4678234352, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6422853412, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2640379648, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4493814924, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3935019933, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6071903248, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4934119669, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.659007626, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3288143137, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5596092732, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4122335242, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6323888083, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.411744062, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5815106363, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2057680488, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3772312085, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1285890288, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3148709024, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1714086304, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3968141821, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3808405117, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7334510091, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2651348897, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6029932145, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0592362552, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3156976516, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.120623551, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3381143514, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4432782055, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7181569026, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3328272482, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6835909949, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2646692275, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5971551168, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6263164471, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8520139045, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4940317096, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7362898909, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5112867163, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7497537018, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4667782255, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.775409428, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4667782255, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.775409428, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2359102918, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4623402888, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1017793199, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3335479382, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3459167763, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7155724078, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2378706072, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4963015559, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3860973951, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6271680934, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.1289969126, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.1025569341, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.249677568, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5596822855, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.315719768, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6311766763, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4216589318, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3644085122, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6157376412, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3969398323, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6236448691, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3804889549, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6349497388, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4324371049, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6305851138, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.439628918, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6487399259, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0989628189, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3761925165, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0193781758, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1805414152, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4894585256, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1651086875, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4762714595, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.277103104, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5216248192, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0597034488, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.2883367116, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0450358358, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.2856990052, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3039981623, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5931856952, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2104028618, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5464826943, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2493264171, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4601227358, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4069614407, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6476222099, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3207863467, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6030950695, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3963106649, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6670602127, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2625805454, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.588680614, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3085738642, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6255460002, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2330150068, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4732064515, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.067970109, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.2715418133, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1956800786, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5228407308, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.205993173, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.449181248, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2047573901, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3934874463, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1409108767, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1299314706, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.294599395, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1719646079, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3081027007, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2534555198, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4514808121, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0927886418, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2907721235, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3517412854, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5232532816, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2998998433, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4520160212, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1168434319, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4029357931, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.282550796, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4828223683, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3308991716, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4942398467, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0688197588, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3087076022, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2023651649, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1689706894, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3260914496, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2572958792, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5064333161, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.47307427, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6716818492, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0673082664, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2395948756, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1929800092, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3770587836, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4127804219, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.606085875, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0287186206, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.0681956894, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2839852728, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5353252373, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5839068686, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7498987135, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.032316186, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.0183728179, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5681285983, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7443891531, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.391577424, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6438987111, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.505292264, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7104337169, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3990114071, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5456268881, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1782721572, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.318306225, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3173241691, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5910464434, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1167574766, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4301556379, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.200572252, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4757636761, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1169017254, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2524390505, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0753997529, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.30092388, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1078517242, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3886262537, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.092829996, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3602616615, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.08048862, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3883983838, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3025042122, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5314198518, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1977940633, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5032281717, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2674907183, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5237435676, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2102469208, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5403945195, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1280398106, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5140283033, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3130981358, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0261043541, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1844923012, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4005834602, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2901976571, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5985964858, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3151295372, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6242597159, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0714597754, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3042020079, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0748720597, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3134735005, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2672991325, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6474323586, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2890449667, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.620578331, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1252109891, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.2534584651, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3486251971, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6519074064, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3128076344, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6051022696, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5047460218, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6981561914, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2622053872, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6045462235, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2501418024, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5948201299, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2258043389, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5033553487, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0984195533, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3327723903, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2615651536, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5337436258, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4629068057, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6888691117, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.529567245, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7151574135, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0715078678, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3509665568, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2173044897, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.457111046, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.332627185, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6707552233, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4196855486, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7433904632, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2894921927, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6202383519, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5995826896, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7943692036, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6993946355, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8854180854, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6176355988, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7898758503, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4475966482, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6848118023, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4559665634, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6856895897, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1488773345, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3502460666, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3362531052, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.489967959, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6996203149, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1838690498, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3263831403, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2995728064, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.418242973, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1492027691, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2337251888, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1524132679, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2373874392, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1948950171, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3579044902, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1279236454, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3042229576, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2423936863, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3482875559, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2409168845, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3760904447, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1912320665, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3643868829, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2409168845, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3462564871, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.264681475, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3831294944, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2919568084, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4097202832, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2207605978, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0088208669, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1753792879, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3388058024, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.062985749, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0493721603, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2356808689, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6055769872, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0705733633, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2779498561, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0597646978, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2948349203, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2841435865, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4668115397, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3192543939, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5392797997, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2923974412, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5000428321, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3593473105, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5947494544, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3754906253, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6588309503, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3405968821, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5628429967, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.417145975, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6924696605, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3086475776, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5998796998, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0640271886, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3469596053, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0332883722, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0199232745, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2151054467, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4846454728, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1599118703, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4667629328, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.342598418, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5854661284, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0427412331, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1133793152, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1497426195, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3726183842, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1143588504, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3859556976, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1174036523, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3950281226, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2396995109, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4998009099, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1998403192, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4849010013, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2610554048, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4745587189, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.134560954, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4564753328, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.264863837, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5560242355, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1578188014, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3627260974, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0351981682, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0159737507, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0437543663, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0202620918, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1905758291, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4718416669, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1314770573, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4224745596, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0915776794, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3701460682, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0666980974, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2189108945, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.1080306432, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0776567484, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1350700255, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2486435619, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2689259076, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5085571523, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2280292809, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5045187042, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0799899653, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4669430023, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2068663198, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5414930563, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2134728891, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5213180609, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3288154768, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0619525837, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2081088014, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1692546646, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3398252843, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2647140242, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6038381731, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2058592651, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4968187716, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1847269093, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1847269093, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3017385988, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5195706056, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1593794657, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4584545397, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1573657384, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4353622003, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6713478367, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2864240228, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.61081609, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4743785205, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7078409133, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3456425407, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6437361453, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3045776961, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.616960363, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3352630034, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2848709355, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1828247249, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.502733748, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1750028134, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4479057569, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2682764486, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5066876769, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1547981587, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3205200487, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2648573886, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0047730821, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.0829285531, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0487929609, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.1803124033, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0773094622, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3543827361, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3583463146, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5970822607, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3084232896, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5533832756, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2728743752, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5680146925, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2605463938, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.56122305, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2920134077, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.569679389, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0985780246, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3780554964, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2318364308, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1672349642, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4598224414, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2961060814, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.334876721, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2115043097, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.225204085, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3055950801, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.102138899, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3287887661, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0854172444, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2822077407, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.147173194, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3561339784, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0955025568, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3229718971, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1579668191, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4072792411, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3956940134, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1048205471, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3662621833, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.152323995, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.225421701, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2727883585, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2652187704, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4100064315, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3876292814, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5446552031, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1536394124, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3041152734, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1536394124, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3041152734, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3033517807, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5110748652, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3043760556, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5831741447, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1125839096, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2499701254, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4177532956, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6150487016, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4725288435, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5979074938, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4843113592, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6440496752, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3836378227, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5763003202, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3908117282, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5754293697, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.269332646, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.487526439, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1333470842, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3203877397, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.4238391936, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5611383065, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2193938326, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1896866854, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.076942623, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.076942623, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2098083111, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.274654869, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0730386354, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2225564277, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1136832002, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3049908147, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2659658765, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2323543192, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1468128975, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.3160134768, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2853697461, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2244878428, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1069432982, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2970355353, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3797470329, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4784059073, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3117257364, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4516642139, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1878322123, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2946556433, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.014458963, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3293405971, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4512922498, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2576254437, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.464888454, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2532199665, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4300207561, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3901440609, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4474502362, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0325666424, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.3526878583, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4468173562, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1665267858, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3242354714, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2184784494, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3923992785, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.237249586, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3582344175, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.0325666424, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.296983623, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.4617755276, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.502142941, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6919014525, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4286493816, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6089294543, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0722560289, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.2987832765, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0722560289, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.2987832765, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4397080749, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7141130991, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3135342426, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6210817766, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2580386691, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3462095965, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5617489124, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7727913933, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4067676613, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6956515362, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.6728450602, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7864311691, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3717155024, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.6551663797, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.5215099215, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7532497199, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.3253454193, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4626445734, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1324062816, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.3439462036, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.4577369373, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.7101415565, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.203905703, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5710358292, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2469120011, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5942693442, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0911356222, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3097682185, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0873716785, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3058141483, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.136520859, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4761370326, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1547487734, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.471235578, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1095254278, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.27831284, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3042729202, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6316368244, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4059763181, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6572798986, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4327596645, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6405112836, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3768478745, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7090128777, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3090595356, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6622367498, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1314989462, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3781558758, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0033887281, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.0435750071, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.236270008, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5323731887, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1101433349, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4112066557, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1543586922, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4415660381, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0722283717, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2554932885, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0440249265, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2455065001, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1378413098, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4211572192, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2487072043, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.57359744, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.013817288, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1253644698, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3457963946, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5975923648, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1444220103, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4879983173, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1062154905, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.431831434, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1719308255, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4713105639, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1780606498, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5082580772, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2914965018, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0341015614, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1264811292, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1970371501, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4326807387, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0240122006, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0975771028, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4197518535, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.1211536982, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.1211536982, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0791188257, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3180943787, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0180953987, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0359491869, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2758632822, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1113631735, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3741979529, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1025915837, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4209327449, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0952806787, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3544690292, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0503876766, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3585941732, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0923081202, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.430027217, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0743936478, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.302371669, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0041614648, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0696769961, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3006764589, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4327667206, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5477430911, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4516989733, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5415798785, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0818695213, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2138900697, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0746802582, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2295572629, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2770785255, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4017475844, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3980563459, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4826923665, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0989626649, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2200451105, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5433298898, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6539235921, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.5092920821, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.7015498636, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4868801988, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6780031796, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4807632521, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6004276938, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4386676743, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5540223699, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0164568053, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0113890622, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1123381002, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.289567844, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.4864023522, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.6149323786, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.0482419698, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2980859215, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5278034227, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2366706237, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3073763958, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1905454024, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4105353806, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2360968429, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.462761222, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1465568091, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3859099702, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3895672787, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.6195204168, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3509814894, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5555382602, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2395330056, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.474866392, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2705411345, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.6382727936, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2616587848, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.59737172, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0859388025, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3937606569, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.0190652043, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0247076457, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1994337088, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5118140585, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0112018014, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1635763278, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0187883141, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1766291037, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3688451939, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5612443054, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4211918927, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6000905799, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2192051106, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4746045892, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5977584264, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.8063885918, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.6868497311, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.8147345978, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4214953004, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.676585514, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4738085398, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.7354659271, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.5010324053, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6978436898, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0703917887, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3262556441, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0042900043, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.224073181, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4499043165, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1050064614, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3190724849, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0969747257, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3745932363, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0426964776, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1953624023, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1680999928, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2738834401, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0652741367, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0691742923, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.4814827673, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.6931006882, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2916733029, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.6116293441, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1668870866, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4728485885, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1297018152, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4710457411, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2470990181, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4876426822, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0876721013, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3862741314, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0332883722, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0184686436, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1169531715, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3888506294, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2369405784, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5263543432, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2525906861, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5384891409, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1472871073, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3814445003, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.139839423, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3782539243, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1182319143, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4539200739, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2349915412, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5277871994, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2327860837, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3034604352, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5927380045, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2743845368, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.588948696, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2660988039, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5830233491, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2321593349, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5476657941, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2678221046, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.6016268776, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1147804099, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3672482257, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0666849325, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2624825156, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2636110629, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5611266753, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1054590577, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4263824758, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0956103944, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4101583288, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.203685511, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.203685511, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0093676828, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0790202585, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1270426994, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0784237277, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2577072248, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2017781982, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4593303345, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0928995102, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3765328871, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1633682039, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4801466572, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1123661641, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4689325082, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1110669149, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4872280752, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0306349417, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0264837893, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1373727917, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3592365999, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0936732577, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2641613456, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3471239643, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5206611438, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1384005487, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0809938669, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1616494068, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0111793123, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0288531194, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0626826036, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.167879777, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.4663547689, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.6673933315, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2650114714, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.510913988, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1860799415, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4128480081, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3276692206, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5803713235, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2967631507, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5149799653, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0089685782, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0810223128, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0150829854, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1339162191, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3410315731, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1980316235, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4080820823, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2281684904, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5295534281, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1949624908, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3337720183, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1185666012, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3380794186, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2320305803, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.57193712, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5146400882, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.491750098, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3407563026, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6182648747, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3226386416, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5545705365, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5196627001, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2704817076, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5452157068, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2774870274, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5366274702, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1225914996, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3778482968, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.332443736, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3472164938, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1349246168, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1072112607, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1084572634, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1084572634, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2038848687, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1145859084, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0800395257, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1621568295, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.265554308, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1441134994, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1497317899, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2143764617, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1463280553, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1524939673, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.014262007, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1155797724, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3603321743, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.570786032, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2826845419, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5045089092, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3040559697, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.50579074, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2895011091, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.575615946, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4588667801, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6234514802, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3916177036, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6068458203, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4378159931, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6143976527, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.0081551743, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1546540125, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4250199536, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3000455627, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5614823339, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3744008469, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4141871474, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3685328561, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3685328561, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3658600192, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3498976319, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3207894213, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3531649912, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.417050865, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4432851519, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3715079739, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3707104996, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3260490458, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.0061303673, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.2903885371, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.335969544, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3096036989, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5894510883, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3216244424, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4789560475, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.144851387, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3910338598, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1495764445, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4378856093, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3212752587, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5721988204, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2219217085, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4377428103, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6211549677, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2850762142, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5782236467, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2248107417, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4984063423, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2675115771, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5494472553, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2760145633, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5472296546, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1190236381, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4338558862, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0066610109, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2253645306, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4365811374, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2833608714, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3821473478, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2384175484, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3448132553, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1008538575, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2775527241, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0986453416, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2775821194, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3818556455, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.280776323, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3839514513, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2404134304, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.344918308, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.326601159, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4364077249, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2833608714, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3809827865, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2479641381, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3530186228, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.280776323, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3839514513, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3830564706, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1403980983, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3014356895, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0721876611, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2401825003, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2096419314, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1385791043, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4126877168, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4336894555, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6793717377, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.389931314, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.389931314, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3595137195, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5619162674, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4336894555, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6377690736, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1051184684, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3307148671, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3869431776, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6962124663, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.516541323, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8152163781, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4336894555, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6793717377, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4338387817, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7219938498, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3541059576, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5902080019, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.2710444516, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.007378883, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.164407913, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1838494824, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4093528825, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2005032061, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.404629107, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2514998026, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2514998026, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1457983702, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3459916112, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3033939025, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4463607309, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3233187869, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3163833715, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5386981919, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3151852084, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5072004559, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2761603008, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4920769651, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3151852084, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5072004559, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1317003425, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3663183541, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3305034077, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0045167118, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.169519092, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3380125248, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1280220257, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.3766998615, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.416179145, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7054426787, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2033344819, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4983193477, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2033344819, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4983193477, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3254455687, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5778522195, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3387562718, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5665592722, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1326765652, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4541518793, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3366708947, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.607430123, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2812488198, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5695765898, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3968896527, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6463733324, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4272870064, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6682855797, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2934521274, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6135709647, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1477219991, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4266201925, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.0087779927, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1228888706, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4148619357, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9025232868, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9169897591, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9234732619, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9472986864, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9709835434, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9951728991, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9154051169, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9757471795, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9154051169, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9757471795, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.488843684, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.8291158209, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.8935248372, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9404428602, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3898504851, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.283078907, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4185889715, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2013008816, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3833494605, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2013008816, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3833494605, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1958598295, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4312028681, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1346180129, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4435148347, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3120938793, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4489929043, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6339860404, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3419664739, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4931724445, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4844328957, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6798474086, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2430565018, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4691227883, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3674668905, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5894468069, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3523079658, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.0064546295, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3609285379, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1726893279, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4780619493, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4206772002, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6309653613, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1333644801, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3748218957, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1333644801, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3748218957, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2482192664, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4055106297, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4501073963, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1204951458, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4795015038, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4238285605, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6321659688, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3950163282, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6461322925, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1631012195, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5625465668, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4126152035, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6344543164, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2934068087, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.600317977, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4234709963, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0018234865, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3722685689, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1528571341, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5481360184, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2216635866, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4583410423, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1954411147, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4036830499, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1954411147, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4036830499, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2247892007, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4500155517, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2216635866, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4583410423, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3439068947, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3721973766, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6020217845, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3552281814, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5990409134, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3528573301, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5945202859, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2247892007, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4616910894, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2247892007, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4616910894, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2285747292, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4605153152, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.0053042353, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.3330162771, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.332321774, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6558414584, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2460137258, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5397894338, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1633194828, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4628159238, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1633194828, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4628159238, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2745762486, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5421002898, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3925121365, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.643584629, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1692731897, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4309064189, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3961867597, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6547203688, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4746791389, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6998445451, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4717991357, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7489646628, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5170969058, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7999241779, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.38137071, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6705221265, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4009045958, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.0062606533, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1719397296, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5092585684, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3235165185, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2718533021, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2138567563, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2138567563, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2690830377, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3016154988, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2474285713, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2253741272, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.360901998, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2291097883, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2853435398, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3383777404, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2591641361, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4126422186, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.311172563, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0102750381, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2967639009, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1960019004, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2537357993, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1954328575, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3029305354, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2071779261, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2071779261, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.194619192, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3021113005, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2056729933, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3053087014, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1499818073, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2781311728, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2798694982, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3524034145, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1964914647, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3024070513, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2791475974, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3778334877, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0101876973, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1176706289, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2588701936, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1399347491, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3090683794, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0077929146, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1565204883, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.305815155, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3539896048, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1617717219, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3565629456, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1151530993, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2804443217, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2363853115, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3189572638, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3821381274, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.010064649, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1649693878, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4294879893, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.279887694, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4858922584, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1196671345, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4209144884, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3486123944, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3458399031, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2786084205, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2081033081, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2303364277, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1772984226, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3991460048, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2149405271, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4080242659, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1092529726, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2403375927, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1092529726, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2403375927, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1533740475, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3658108225, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1662870105, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4031359333, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0226740824, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.307322971, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5740871392, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3079181031, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5601926721, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4511589056, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2434623104, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5966001227, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2796635629, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5478435692, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.108451829, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3117325187, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0077929146, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.409152887, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1598051812, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3462061116, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.351387494, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5764814747, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1677193014, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1985794341, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4388967512, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2274336387, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5072109324, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1674968498, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5366411242, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6918385856, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.342337572, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6262531467, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3091394458, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6747861906, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0221846327, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1294619581, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3243466208, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6005859006, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1379662085, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3567938876, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0072819023, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2168690547, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1557851967, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4636631211, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2069099661, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5406044734, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.293995569, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.293995569, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1155471624, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4790979458, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1931272038, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4821357997, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4908356679, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.5295250577, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6698621491, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.3689615672, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6019015041, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4295721432, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2396621968, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.5979264101, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2396621968, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.6128846774, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2583014514, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4896048355, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.0067786449, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.2846692049, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2549174311, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1055673772, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1405378973, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1220184218, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.137776577, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1503218495, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1092963702, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2609493813, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2814587488, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2998660085, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.296140964, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2410288519, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2970891902, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.1312237252, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.124599145, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2338987151, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1466978554, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3937770502, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1466978554, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3937770502, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.1863486844, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2958648967, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4674087352, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1583367284, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4191767182, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2674756847, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2033250077, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5589196419, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1497342212, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4249764679, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2005714669, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4559416667, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1850611533, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.509686347, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1843925187, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5106980997, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1139465925, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3384585011, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.0078664799, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3386070409, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0727163379, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1159663279, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0888022338, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0888022338, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1302790809, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0820818031, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0888022338, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1901593117, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0917637885, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.059324049, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0403549452, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1253385069, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0872222222, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0608409053, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0831610736, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.1939325545, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2188350648, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2418125754, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2727542435, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2418125754, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2727542435, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.212419655, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2485607523, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1218157576, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2369888395, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2109910814, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2461989424, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1561508712, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2966884812, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1601280792, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2825590658, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.209922403, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2402975944, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2164643623, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.014140613, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.109588603, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.267664271, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4581555129, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1876296055, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5048762255, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1862630066, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4752534997, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1862630066, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4752534997, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1847479638, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4904694577, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1876296055, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4918089443, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1196068924, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4380448627, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.187962177, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4755181716, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1984324635, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5123967771, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1984324635, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5130090742, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1847479638, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5111651781, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1876296055, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5270918783, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2693835819, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4662532233, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.0065650315, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2839390003, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5191104889, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1930763339, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3425655074, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.3554016411, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5028380577, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1929043129, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.343894644, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.119986095, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3020689312, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1902855742, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.348122705, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1088065443, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3608349901, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.1393878238, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4352047032, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5881445233, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4619867536, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.571476398, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2573016641, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4456135188, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2318569185, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.4329605534, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1967483629, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3689264104, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1019995266, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3466033417, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.0062219109, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3231291403, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3129163386, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1530025229, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5221038027, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2758817099, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1775856953, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3914970015, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0374428024, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.231425496, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2398704714, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5083946276, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2644204377, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2534901676, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4596959756, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1264591584, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4570024161, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1955198139, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4488382703, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.0064382431, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1217984232, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4354660336, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3256050777, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.1640209092, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1495764445, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3511309251, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3319100075, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3269259733, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3003972272, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2947899275, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2944087567, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3007628552, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2702894645, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.320107511, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.320107511, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2133605239, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2830838263, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2838681982, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0287570777, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2071550002, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.213802859, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2051692646, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3224454187, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1784284488, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2891589197, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1037234403, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2615059404, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1507296995, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3087381775, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1316423588, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2949567194, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2879469255, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4591810337, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2036293977, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3339929789, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4683082257, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3299531546, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4840937399, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3013756361, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4662399448, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2639764335, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4159003903, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3023095133, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4131900681, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0378007652, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.2260779872, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0059620333, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1341990972, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3116082737, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0882299774, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2497472444, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.09500509, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3165301597, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2360982005, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.223674024, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3129137956, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2554146381, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4265387921, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2609135479, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2494006679, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4342326034, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2494006679, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4342326034, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3493604523, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4829868974, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1220951694, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3186107105, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3009720608, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3149833038, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.0075802493, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2029445208, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0084444188, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.111834477, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2981154499, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1947081063, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.1947081063, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2224158573, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3993550498, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1946918133, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3702922644, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0988151148, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2615108001, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4144465172, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4950881105, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3110891871, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4573498365, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3707041919, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2756918914, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3996541462, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1977587697, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3524925021, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.219417732, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0084230799, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1683248432, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.2952766411, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2188392829, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3942803458, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.2796517015, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4132532584, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2864494973, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2857216432, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2875582279, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1619591902, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3600614648, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0100403957, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.190862037, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4060355609, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.38060343, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3652515754, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1900136998, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4038079481, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1589291335, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3853450613, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.171793937, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4061991091, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0101135087, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2723477674, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5001337106, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3928482205, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5731994852, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3224419519, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3224419519, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4583677549, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2864900352, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4754058247, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.52596811, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.693890502, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3961580558, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.625810777, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.3961580558, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.625810777, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.2029652695, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.4014874095, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.613612103, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2989898445, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.5666357652, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.0063886488, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3936073912, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.106602827, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.332890707, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3228478591, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5391266649, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1221622381, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2863088425, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1175116376, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2639231373, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0861688523, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2353641921, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.074582274, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2600891963, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1070404755, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.3125785782, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5024602461, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.4145206536, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5450885611, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1353204366, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4699960908, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0448678445, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.288128037, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.2583416801, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4801148644, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1064989243, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3005075192, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0072504791, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2196332371, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2801468316, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4843599291, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3355724432, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5209156086, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1447589271, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1630920646, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1319426591, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1536584418, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.3886375628, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.5670767165, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1992351466, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4391618609, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1087116451, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3428376126, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3944787953, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3341922275, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1639598245, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1134519688, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1586668325, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3553678594, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3430358969, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6476809, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4310358, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6690742227, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4583355789, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6740129256, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4583355789, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6740129256, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4788542814, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6734455798, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4788542814, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6734455798, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5108209375, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6791666897, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4330463947, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6198346106, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5730366637, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7197637549, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2981426768, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5882799317, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4263005629, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6688425476, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4263005629, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6688425476, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.448546207, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6460034218, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4579102349, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6417119032, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6252078221, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7406162627, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1309326502, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2442359455, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1077233201, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1765271437, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0905841537, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.248289409, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0840969341, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.242819879, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1864036495, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2818846538, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1199713969, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2490954872, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.123262375, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.254313875, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1775513273, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2793955277, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1155244934, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2255572925, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1445047538, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2737322242, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1957899789, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3225341744, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1998983872, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2754449185, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2128604974, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1372480434, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2232907499, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1496936339, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.278209861, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1656131533, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4491486314, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2719091012, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5173567852, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3764808757, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1673300635, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4300982092, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0985132569, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3616605985, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2788187959, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4519726809, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0810847933, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3244624256, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2985215838, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5357534811, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3606261468, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.565769528, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3485454775, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5565027261, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1959348788, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4136765524, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1959348788, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4136765524, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1445526834, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3511816606, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.0883951234, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2117778162, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.446074174, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3118437334, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.497891952, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4295120748, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6066779955, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3766108383, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5627715651, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3766108383, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5627715651, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4257605184, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6026940597, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.414619311, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6016308463, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4185497913, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5947798106, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3965389355, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5591087327, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3545643809, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5476462735, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4051802203, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5707666164, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4257605184, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.607262076, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4249672153, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6168976239, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4296327575, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6275089001, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2428722039, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4829182995, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2730932205, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.516225585, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0995061577, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4145753205, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0959613693, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4084914721, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.373654149, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5663575595, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3931799632, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5715002055, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2160624856, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.478097701, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2076886079, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5045131604, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1948267249, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3739720454, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2254652167, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5396972089, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3347794279, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5836257841, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2350277891, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5533644883, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3288562545, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5875530352, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.238581611, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5352521385, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2234569427, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5021464202, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.024449793, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2574839776, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.49702079, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1855526569, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3943451217, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2297263148, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4361029888, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2525918505, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4202404401, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1576533178, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1587543502, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.411444362, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.232526345, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.417692446, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1028903377, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3479245449, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3554132463, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4941662759, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3898899982, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5383555577, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2674575412, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4673846703, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2180807047, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3966492623, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2101112712, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3666764488, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3330574461, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2611660786, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0919692294, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3595019474, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.389624004, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.603937614, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4502696568, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6668256174, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4074412821, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6128620945, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4074412821, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6128620945, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3106689221, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5821286482, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3894734858, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6093782293, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5193184368, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.746884081, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7296050985, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8833183866, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3096348872, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5646940504, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.558567416, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7915059223, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2950403708, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6837809128, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4893545471, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7097085615, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5723452381, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7571087352, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4468091302, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6484739719, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8247818102, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.385113737, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4710260495, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3719027199, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3530084317, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.467731789, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.386998289, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0977318386, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.425815692, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3787500122, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3752043812, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3543538316, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1023588184, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4279439963, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0923037226, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4084071496, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3777505211, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0964962294, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2927581008, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4313197463, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.636712966, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.310186303, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.543454013, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5844803971, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7063190919, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5844803971, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7063190919, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5201565256, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6663170491, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3234262987, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5509482497, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5471998982, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6620274291, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5471998982, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.668797436, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6201952807, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7357975825, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5950978682, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7209575533, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3663414044, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5925773492, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3935907912, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6064279839, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5201565256, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6663170491, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2672991325, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5378982231, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4880149105, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.717746493, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1395079697, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3461520644, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1720725885, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3052503499, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1904797464, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3156575555, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1904797464, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3156575555, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1377448219, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3565144752, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2859947827, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5006114056, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2479775296, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3393109592, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5094767086, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2557823082, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4595913832, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3653634813, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5239315135, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3001926669, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.520168227, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3405782536, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4740333086, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1995574589, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4701104981, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0229251189, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1079399157, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3418311351, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2328843209, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5712248207, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3779494671, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6288808547, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2784369069, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5290670344, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2854915274, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5160719091, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3335574881, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6172751686, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3081962527, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5915465658, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2539395182, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4638805677, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3935985209, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.626545906, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2472010935, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6067542031, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4719455252, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.644979373, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1043683969, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4723697955, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3081962527, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5915181594, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2500390778, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5740099623, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.104807088, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4347737896, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3712375815, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6205370333, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1663603559, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5225044219, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2834162669, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5869314876, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1827972236, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4782583533, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1827972236, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4782583533, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3449624286, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3999239566, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3948810099, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4292943493, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6516072033, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4295114388, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6426984036, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1977166163, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5115994004, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4457322258, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4346320451, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4980697864, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0080863887, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1778191605, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5216356192, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2407843507, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5511929774, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2339948566, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5631067041, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1900264384, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5613137257, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1900264384, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5613137257, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1508468192, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5314568463, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2698196759, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5640017836, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1191106613, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4416525185, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3181824678, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6229693134, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3519053, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6501952974, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2880997378, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.595204668, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3315037522, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5881480424, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.174036476, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4845935914, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3337338879, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6611983572, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.0189032129, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1721831215, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5841092375, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.180817191, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.52074883, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1793410088, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5126133937, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3585760941, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.599983087, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3585760941, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.599983087, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.243284204, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4502822427, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1281916094, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3968207935, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2846273714, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5068034605, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4008628433, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5958332944, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3938117685, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.568306575, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4150528219, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5557512736, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3369338117, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5939057048, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3369338117, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5939057048, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1852365018, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.450559933, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0736727261, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.372116922, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2571225648, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4854433762, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2762822898, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2494209435, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.7065161304, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.8047179188, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2353716486, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6897992635, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.664271838, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.7768492312, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.7660237942, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.8523393041, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1948202342, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4675579314, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1935591956, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.393175963, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.094174565, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.094174565, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.070940725, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3513533312, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2310435477, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4038592288, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3633072012, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3592209878, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5721408825, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3272043177, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4954062101, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3322425568, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5053022384, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.240029446, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4281869814, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1466236181, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3944286703, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2613422109, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.255011496, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1803847357, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3719715144, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1169629983, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4181595169, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1674342436, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4331161882, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3473759202, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3434479963, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.394388905, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1375487849, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4400994485, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2623022556, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.096669262, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.438593587, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1065549802, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4300714729, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0857082791, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4443126848, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1126574422, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3948153025, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1365091799, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3971858557, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3430299755, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3015299042, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3404467437, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1148193499, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4747875328, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2089685256, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5333424925, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4677716472, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.15744827, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5597535179, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3906806786, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3750346311, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2612523014, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2789924976, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.543733561, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2764393753, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5214300182, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2152132516, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5498176883, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1894855225, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4888270048, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1759239126, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4635136213, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0878497559, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4566528138, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0090200253, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4228408463, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1432651349, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4797608005, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1296922312, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4475369521, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2581548973, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4911644025, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1492903381, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4767021982, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4674650269, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1036222283, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2553804995, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5077415231, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1653107113, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4890742062, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.176873868, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5306318459, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1432651349, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4846286435, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1432651349, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4878418865, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4272306128, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4315166819, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.142894354, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3929455911, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1215403961, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4184192896, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1541530225, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4123343961, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0775634737, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4117418041, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0535817236, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3281836072, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0590068622, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3017162869, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1065084631, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3426366343, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0516461144, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3047911046, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1299080632, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4208750314, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1673384901, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4752813132, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.2800051946, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.500208218, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0658346467, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4505447671, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1746139174, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4282897634, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0966569429, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4197271808, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.1157800433, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.4640603999, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"bleu", - "score":0.0631213929, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"translation_to", - "metric":"chrf", - "score":0.3372424748, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.205876731, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4757245821, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.180871406, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4377272236, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2525417661, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.2965045198, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4697814784, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.178820686, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.54085956, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4609622407, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.205876731, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5260086668, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.3332535149, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5948182732, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.2847897935, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.6101591431, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4978503857, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.5116515365, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.1417026145, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.4360186126, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.0098169765, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"translation_to", - "metric":"chrf", - "score":0.3984749327, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4757656003, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5469867444, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2200045848, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6138504492, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2200045848, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6138504492, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4083641834, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1323764586, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.4485561487, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.2399509189, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.2300556724, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5929496963, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.219805034, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.561473329, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1820057458, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5620165305, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1737720879, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5789527486, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.1761368775, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6050330397, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.5589534921, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.3896603574, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3272263309, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"translation_to", - "metric":"chrf", - "score":0.6208501228, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1596886882, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1818063041, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1803476066, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2058773576, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.181205062, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.181205062, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.146370162, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2032908752, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.188429759, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1707584036, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1740044679, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2160551293, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.091656988, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1443459994, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1524760852, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.2009965683, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.1675740495, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.0836150448, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"bleu", - "score":0.1474542551, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"translation_to", - "metric":"chrf", - "score":0.255428437, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1925903911, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3671206202, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3147902136, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2726119138, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3161459452, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2424470037, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2655680598, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2291992284, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2197204636, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3190137698, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3179398168, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.2163965996, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3162880684, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.1927621321, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3542214625, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.3738879431, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2901450732, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2702695112, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"translation_to", - "metric":"chrf", - "score":0.2214472509, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2755198906, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5356254488, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2693653653, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5351323892, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2804805733, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5173444818, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2804805733, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5173444818, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1635191686, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4804882398, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.265269838, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5353598123, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2665145369, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5171512452, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1837403354, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4991399242, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2435306777, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5166317384, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.2294197979, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5102280024, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4534476471, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4578627549, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1999115917, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.5112420302, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4166251963, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"bleu", - "score":0.1741974302, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"translation_to", - "metric":"chrf", - "score":0.4671523919, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2552675719, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6364430512, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.250320284, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6628587961, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2405359057, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6655821854, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2778012827, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6711394083, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.216299191, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6724473561, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0948518028, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5297797609, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.1999424541, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4644985338, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7639212954, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.4646770361, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7875365173, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.1987579861, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6616311958, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2454606701, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6558538403, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.2446000556, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.7189156627, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.6314478475, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.3935354454, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"bleu", - "score":0.103011753, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"translation_to", - "metric":"chrf", - "score":0.5376516921, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2828935596, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5240089168, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1519763037, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3903562094, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.1709646164, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3692462955, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3058932495, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4580316608, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2215392629, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4125710291, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3329262969, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.2369770576, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2718193327, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4809886758, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2361834729, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.4962696728, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3397501129, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5046267909, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.3039889131, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.5189316342, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.2737404369, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.44170111, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.092767342, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3473883139, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.038929275, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"translation_to", - "metric":"chrf", - "score":0.3715413713, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0809290516, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4032555174, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1767721526, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4249279437, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3167136634, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.255618614, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.306603334, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1367094874, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4671925185, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2630232513, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1467727892, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4397670836, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1550649276, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4475601469, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1157245386, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4035026532, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0860958371, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.393787114, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.1517985731, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.4250156741, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.3082198822, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.0966398396, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"translation_to", - "metric":"chrf", - "score":0.2862332781, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2830521146, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4573087433, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.223127008, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4189240455, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.206879059, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3623403977, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.206879059, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3623403977, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2257991293, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3783017116, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3297857792, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4292403961, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1408857027, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3918583818, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3766280281, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.5618752988, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3092686619, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4734674396, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.3237982652, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4625824766, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0091986566, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2595791359, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.3835676033, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.2430631877, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.4371598963, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.0180364018, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"bleu", - "score":0.1762869532, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"translation_to", - "metric":"chrf", - "score":0.356746255, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.2341631594, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4208857451, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3879139891, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5307069805, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1152547411, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3599175709, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3149088323, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1910771867, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4125999495, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3452401484, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4895068008, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3099441998, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.474264638, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.5050428988, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.649363596, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.4052322981, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4961184708, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3328216606, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.4941913603, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0538790208, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.3802149154, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3139213226, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.575489683, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.1245312761, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.2986317421, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.0072116343, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"bleu", - "score":0.3243463644, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"translation_to", - "metric":"chrf", - "score":0.5301315753, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1864340365, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4740941038, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1594253066, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.515199742, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1551207146, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4522222517, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0756226321, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4040528518, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1124795147, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4918141546, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2603725862, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5454235945, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0734366066, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.3787234084, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.2921802716, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5926371898, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1112538229, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.533369486, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1666927839, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4915920022, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.4116397174, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.6347999526, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.3447572227, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.5387838115, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.406275655, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.0459639636, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"bleu", - "score":0.1718898827, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"translation_to", - "metric":"chrf", - "score":0.4922742182, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3490672285, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3280456612, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2423006903, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2645571441, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.1302993662, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0393538696, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2024319322, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1186565949, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4372933545, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0704339795, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3852802461, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.322786472, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1462796114, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4462737548, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.1538766031, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.4518012669, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.3286241329, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.0087210906, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"translation_to", - "metric":"chrf", - "score":0.2647246445, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1191908679, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4518769869, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1061568454, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4600466173, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2305452794, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.496079091, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2305452794, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4915475454, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1386942877, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4645315408, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1001225427, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4079376571, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3829530313, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.2284412624, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4904265148, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0905195403, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3959277285, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.139731585, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4245791517, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0969377042, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4325087281, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1367597636, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.4986242378, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.3765622773, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"bleu", - "score":0.1258832954, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"translation_to", - "metric":"chrf", - "score":0.419555188, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0724367167, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3979807617, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4139226962, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2471636446, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2382081559, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.0749853243, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.108464803, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.1308609485, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.105338613, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4856442758, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.1670515635, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.5251495423, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4006386976, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4223466542, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.4355116712, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.2548887819, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.022883129, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"translation_to", - "metric":"chrf", - "score":0.3391502707, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.118230532, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3361401069, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1383920988, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3531514774, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1030654075, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3271343056, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1030654075, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3271343056, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.0793438981, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1105560791, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.320368514, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1386295454, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1044701548, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3834682647, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.1570432712, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3293030041, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.2498554087, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.4335702335, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.3398774919, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0976308886, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.348851692, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2863678077, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.1746004151, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"translation_to", - "metric":"chrf", - "score":0.2874462969, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4.1-nano", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-4o-mini", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo-0613", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"openai\/gpt-3.5-turbo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-small-3.1-24b-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-saba", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"mistralai\/mistral-nemo", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-lite-001", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat-v3-0324", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"deepseek\/deepseek-chat", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/phi-4-multimodal-instruct", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"amazon\/nova-micro-v1", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5820808184, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7378873385, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1919493791, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5477665664, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.615298028, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.831128159, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7056438934, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.78254229, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.8503171628, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3045613775, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5275070803, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3857436691, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5750224388, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1547142813, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4580211317, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6595394847, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8217096607, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4006636128, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6653649738, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5682331555, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.682737177, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.78254229, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8503171628, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5398261391, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.739237388, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3288580455, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6084553206, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5076849582, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.710481583, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4670851532, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.640678121, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3448470566, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5402688339, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2920008663, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4711920796, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2662895143, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4434736704, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2101630852, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3954963698, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.9144679601, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9686368875, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.60448204, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.713020803, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5946618487, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7171023095, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4224822178, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5623149154, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4122044215, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5511084783, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3021398447, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4574822139, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5447134963, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.726199366, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4632506462, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6209714942, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3603147151, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5689403612, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2116090792, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5313905407, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1932686964, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5338237269, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1694466725, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4902502032, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2336537843, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5428777593, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.443810215, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1404085144, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4142346468, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1351908298, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4077309037, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1587457184, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4183751517, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1056537246, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4443809914, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1360715984, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4245026254, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1345824232, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4423141278, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.23544416, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5020320865, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.069857125, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4602606238, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3208741194, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5929208087, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3932292316, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6872277876, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2733878926, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5225641007, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2377604053, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5662768009, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1415253671, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4694433068, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2323385181, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4886113482, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2868985879, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.583221409, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2692065609, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5743171011, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0090442457, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0499217277, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4528624345, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6527368961, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3520774812, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5857728616, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3964697637, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6290180588, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3608351362, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6215415104, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1642435584, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5707570207, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1188717945, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4725226647, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.8247196817, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4021461277, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4512842459, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1977587697, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2528519998, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2926148803, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3659823921, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6244631487, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6931369519, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8247196817, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6095824652, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7240463525, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.377622704, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5372679696, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.8247196817, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7123666275, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3627848276, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5349346533, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2376748633, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.440987821, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1398001346, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2973979681, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4869882768, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3770929789, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.7019510305, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6364887817, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3349151749, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7148385237, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5600030479, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4173415078, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4205225801, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4085415213, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3963957407, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3958941272, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5291971593, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5291971593, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2538527855, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6210036405, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.614927324, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.8453493909, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.5738396575, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7983571334, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4741000223, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7538467008, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4814564802, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7621649609, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4814564802, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7647955332, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.686224909, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4246163318, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.671781609, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4047272002, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6392900614, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3014335252, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6287268013, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3025029866, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6057244918, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.373921491, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6665214662, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5576394962, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7314899377, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6255340042, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.8724783049, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4012328255, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7187563586, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3226386416, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6744253147, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.5955978089, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.8632174103, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1107650255, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.331093823, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0936832192, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3110560184, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.260645177, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.509220611, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1723326961, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3877418094, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.15753944, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3831139958, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2401586038, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4322848605, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1492962176, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3813364386, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1313896619, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3949801414, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2586476023, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.537961002, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1858144172, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3809051081, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3340180482, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.193567336, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.399276763, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1322628325, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3875130479, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1242329075, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3279678425, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.4333488015, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5993145227, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.5065289744, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.6530054778, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.362151759, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5866873582, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4573456096, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5806207458, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4106942927, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.493809375, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3089009202, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5553909583, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5834549494, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5860075143, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2974074485, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5163339434, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.268182028, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4507857635, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.5116492273, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6206166199, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3716332024, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5698425038, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.5234484809, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6059134319, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4960837619, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6960674548, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1905565033, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3977300361, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3337408701, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1180905709, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2793034278, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1580433751, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2141111475, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1145586442, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2150669504, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4251675823, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1633896822, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3860270758, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2597384744, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3657744669, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.128481541, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.1828802623, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2728731894, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4511791218, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1381958549, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3096769616, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1511224641, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.42313984, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6179728224, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8116973109, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5643083887, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7795248833, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3915127524, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3962800718, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4327180981, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4441466437, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3656382407, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4042109174, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.9144679601, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9686368875, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.60448204, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.713020803, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6198967678, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.7481269522, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3405810806, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6454109254, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2939245264, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6089201616, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3311313826, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6441268906, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5238819207, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6661862665, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.489768506, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.62541231, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3367620726, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5105306321, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4710911328, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6679686333, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4271153755, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6509536054, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.6708620896, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6530359035, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3922991602, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4080642476, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4969402532, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5304108265, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2530156938, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4697567617, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2440257845, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.492956031, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2535874532, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5215217562, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.465085908, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6778737063, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4395923922, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6587083356, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4784954271, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6488586266, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4253973849, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6618555851, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3483038073, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5875489793, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3445753349, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6264226575, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4648082019, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5916357493, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.6197199631, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.718089441, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5653218965, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6143875608, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1509738618, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3420592853, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.131094091, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2800912841, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.241065739, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4304366929, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3261746996, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5353080845, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2098897598, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4360039344, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5158788412, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6415838328, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4892773847, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5670432585, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4237266446, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5153633128, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4305675865, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.63125083, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2993584441, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4918263974, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1353306038, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4104434302, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7828161456, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8875256123, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7406375009, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.916098851, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2352525319, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1660437618, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.139825303, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1150338804, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0793331743, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7049592608, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.80590567, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.7608566263, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.881580297, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6885326215, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8229812189, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7135189441, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4747354911, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.73602868, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6373412314, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1509481321, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4327181828, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4695363242, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3096153428, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4869882768, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3770929789, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7019510305, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5907010931, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.599558184, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4663322216, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.455960373, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4140442654, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4040328945, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.316429969, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2723413787, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.293127261, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3545968453, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5519360559, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3545968453, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5304888393, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3631474834, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5430495415, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3276500834, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3308631604, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2294068721, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4395950991, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2538527855, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6210036405, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.614927324, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8453493909, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3061357456, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3616235652, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2074813196, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2716205232, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6179396438, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.866516296, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2418068126, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5283791447, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.614927324, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8673390132, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5440766841, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7530101165, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4024582794, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6686551997, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.6976333496, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.8331572108, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4500181541, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6036911111, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4010689686, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5585374123, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4507354055, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6086043978, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3567464687, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3675887542, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4593860924, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.5045746405, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2591849138, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2552839984, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4521224402, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6051669625, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.397344358, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5535504661, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4521224402, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6051669625, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4226108217, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6331414172, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4226108217, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6331414172, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.697724039, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.8189844672, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5582486914, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6678493404, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4298810543, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5792724215, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5339784399, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7711693678, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4906190889, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7085658773, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2977737398, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3247262668, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1310017131, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.177273908, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1952754389, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2613440611, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2720157532, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5659565995, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2030347987, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5105569012, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.231961983, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4927185777, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3860319194, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.57524876, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4062689293, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5780690651, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.282829374, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5953149441, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3541689687, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5902329125, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3451069968, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5535082901, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2107785765, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4505234165, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1875920232, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5919327752, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3166934923, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5620795602, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1750913104, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.209260824, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1049851994, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1535119641, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4501609222, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6274091785, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4352771378, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6534533975, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.4378159931, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6205808811, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3753569138, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4322325533, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4103289978, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5761410926, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.688570898, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2760145633, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5543439466, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3423551115, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6041763685, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5417436516, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.695816766, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3576389773, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6001423895, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.177282908, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2719652709, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1413097829, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2886321729, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1412980859, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2425598176, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2900517146, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5311383978, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2778215331, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5487851761, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2077534942, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4535310744, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4066949391, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5560688632, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3517429611, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5511188972, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4403845293, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6366618751, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.360602983, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6158556041, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1856902725, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4949007819, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2635679397, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4983679981, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1636530343, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3913206823, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2875119946, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5315730119, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0761074979, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3158679212, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2567884686, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.4445207366, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.8324660076, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.9190284212, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0252236217, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2350943461, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2123133698, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4590317673, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1224029997, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.365840156, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0150426288, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.1539852614, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.1349904843, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1023838278, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4046574238, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2961253573, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3725426622, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.1554801198, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2962569558, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3345606592, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4009450832, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4095908744, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6348509381, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2544255509, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5578669986, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2119156724, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3642217157, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2432845012, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4594188595, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0389300424, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2121610889, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0831876221, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3467775152, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.144260109, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.295408701, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1325275948, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.2868277082, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0129900785, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0487020134, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.260255736, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4700206616, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0203225763, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2537472768, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.221499195, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2366036239, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3671096926, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0861116128, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2872693016, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.127772761, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.2091659231, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3582184052, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1223177217, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3067683268, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1085135458, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2968183524, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.113060164, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.1707299686, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0759282022, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.3237722713, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.665788023, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.6028817682, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.8937427109, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2097342579, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6906917347, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.4014538132, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3835366017, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4043598708, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.334002021, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2503824473, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2998065854, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.794069319, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9226320693, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5440465293, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1434084599, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5451343313, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1287433051, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3817491925, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0688260471, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.400067684, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4489771072, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6575894646, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4246163318, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6463883518, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3191485537, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2383041257, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.4701506351, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1866228307, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5545156731, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3558785149, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6251813349, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.3840594021, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.3507534175, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.618477849, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4216890914, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6885217194, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.7411155087, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1717217069, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.5514871631, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.168422147, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5027567893, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.4028460317, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.7393612332, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0878049954, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0790804547, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2408268617, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1023361886, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0172835892, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.194726701, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.1025721627, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0905735713, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0756232112, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0953372986, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0988106272, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0834874022, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2553727556, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.166411781, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.2001459084, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1545164621, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.1855143879, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.110473448, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3041593885, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.1804638322, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.1811318093, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.1685996647, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2265701279, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3513520405, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2778201384, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.5065446933, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0924108658, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2418907918, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.079149304, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2273620457, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.1435893752, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1284649702, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3014976338, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.2319908563, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.2269289302, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4654311956, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2755380202, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.372032093, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3288127617, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6382679381, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4946107362, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7394349768, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2152501401, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2654640308, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2884343177, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3291519059, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8008661202, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.9129539473, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1698386907, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5144379459, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3092944545, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6266544541, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0657005581, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2947780789, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3137846786, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4985936683, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1549348297, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.4736195958, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2789780713, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.601087115, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1571025246, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2212055901, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3167402933, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3785721087, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3084036356, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0601000445, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3175726617, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1043885689, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5031786975, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3719832112, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6081799487, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4475531371, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6380525616, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4353318655, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6645574621, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5158575227, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6643754283, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5745763624, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.687021256, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0717361981, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1431413915, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.156097278, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1424128147, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1365597487, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.229649115, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.386677557, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3046628863, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4170366809, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0518711466, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2199581403, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2197413853, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.2931324887, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.1888670976, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0095785441, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0050813008, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2848931828, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3884407274, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1943067625, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4717898077, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.0694363994, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.1976332727, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.1177403558, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0711623755, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3237722713, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.665788023, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.2392351113, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.6943484573, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.5984586488, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.6238768677, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4272048647, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4259865555, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1935113177, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3748723088, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3817620388, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2483533682, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5232389057, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0922109858, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2837702298, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0921248009, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2769793882, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.794069319, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9226320693, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2054802437, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3122579263, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.239302102, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.179372441, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3752584533, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1028840244, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4033391696, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4165530721, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.702780513, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2484897137, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6199962672, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.1179759499, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0635345617, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2585313798, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.400754312, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7800092296, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3240818894, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4247828944, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2677722329, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3611863851, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1043129334, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2753581328, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2930072899, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4492540807, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4226108217, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6331414172, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5521710658, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7317828776, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.4044783343, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6186227035, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2444794643, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4568302985, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0836901996, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.2618756815, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1104532827, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3509896821, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.094994277, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1291356082, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2958409147, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.1252923366, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.2108983192, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.2159783664, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.1783654107, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.4789052847, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0337967386, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0199232745, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0523099661, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2825860966, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.1870347306, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1221966748, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.3810153226, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0485063199, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0930869606, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1029370477, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3804609625, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1418924299, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4180976485, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.2042570146, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.1441370455, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0356225175, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.2348600433, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1469924855, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.608209796, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.1776359359, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.5545126298, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.2219387721, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.1036508893, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.203729846, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.100168205, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.371442108, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.1670515635, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4145311709, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3498701287, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5383179684, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4455798194, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6134429567, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1064401296, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3072138741, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3436298261, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.474097066, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6509090647, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.456459237, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6180934331, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3099822675, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5099477959, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0817187191, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3010070158, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1065141414, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4142627902, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2955647067, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5006575555, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3495042928, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5226314495, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.305198761, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5067245421, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3287552112, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2284332894, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4306199293, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4251413992, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5934850967, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3681660378, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5541114417, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4107741987, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5940312712, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1053000041, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3555014165, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2543887713, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4829008172, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4512944754, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6017904208, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4209183126, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5827229431, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3624018198, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5452543645, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.34346098, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1644848431, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3801831706, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4678277773, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6774531401, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4983736733, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6501877931, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4753487652, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6537763314, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0922659318, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3405122933, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.283423467, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.5292367321, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4232366468, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1254519534, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4649420285, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0824102434, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4192858928, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0890330137, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0547100649, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3744525539, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0895042627, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.419071051, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3763004098, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4072803846, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3370553078, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0573570783, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3783970168, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4414911655, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3831814619, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0688668932, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.41744977, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2303344611, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.314884268, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1505038282, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4714951011, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3873416882, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1192169435, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4496293774, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3025316557, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0795904781, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4188916198, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0902660698, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.460318013, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0850719245, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4573773027, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.16730389, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4802816707, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.1205394894, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.328020777, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3522044896, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6269953758, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2424196213, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5404432592, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2677475159, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.55614295, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0744305025, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2827880483, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0450255942, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2390092638, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.457706572, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6729985528, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.196195789, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5613321222, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.156821759, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4423947018, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2877677723, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4559192838, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2737513623, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5787848381, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4853636565, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0087183267, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0500524394, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3506712655, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2866221441, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3878152533, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6512757513, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.17157837, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5548432095, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1387226548, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4849321762, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1016310669, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3724573242, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2031034196, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4121574695, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4586552516, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6547109311, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0878922652, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4940541478, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.286326551, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4941431815, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0851163094, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2122167121, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1154677212, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2305118351, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4093301993, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5021029088, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.52087071, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6374458452, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1784687728, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2562032816, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1746034236, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1055048277, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7056438934, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6834390596, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5364361873, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.627403903, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.1367747893, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1566391541, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.2864960007, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5804511284, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6874078611, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.5806197937, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6900625849, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4685280966, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5440874151, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1586707737, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2202068136, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.1119693163, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7056438934, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.8247196817, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4390960898, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5382986509, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1534613282, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2492580245, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2563868558, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3514140972, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.5653615736, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7346706701, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8651210439, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5118761227, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6265140754, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2100449053, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3263180094, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2289415686, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5250258007, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.296609032, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6426557362, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3541296817, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6426557362, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5533112693, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4508965266, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5396070985, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4063253296, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3419150962, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.315903662, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4627030912, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5639241777, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5537700016, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5316691911, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.504409738, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0549338636, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4999854027, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.50663118, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4763442923, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3927435572, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2794663372, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3717046642, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.508747354, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7773819133, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.6374542947, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8113463692, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1512514933, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3464954765, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1929725997, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6525309891, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5300714513, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7461630751, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4596980088, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.713787746, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5311807486, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7051928034, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5271017465, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7749613595, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5929835222, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7236869252, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3231203125, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.581227569, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3272712268, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6272846474, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.476501312, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1753767087, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3729722122, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5122282714, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3485799123, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6090575372, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5948590702, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7529648154, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.373921491, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5833802647, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3556254906, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5824692855, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.373921491, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5833802647, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.6912804408, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8416888527, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4246163318, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7159049341, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.1477240637, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2327576131, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2357664507, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6409280879, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.6991726442, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.4262626091, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.7324097685, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1523704379, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4210744226, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2848931828, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4861198407, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6506028605, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.483123361, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7122562458, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4222184785, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.6896985035, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.351603568, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2596893636, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4210960583, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5955978089, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.8632174103, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4896430867, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7719180937, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.538368094, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7860964064, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4803501445, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.7417101158, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2541700511, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1902324956, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3942128595, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2552422097, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4216294389, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1447896195, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3253709276, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0699262958, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.259389944, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0892217802, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.131072415, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2584637076, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4472520901, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1441045124, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3381676629, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.122121549, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3607027805, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0625989807, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.243715448, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1784840705, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3773146619, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1264228524, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4004439009, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1382122903, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3045128799, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0890466923, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0557104213, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.216182416, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1816921205, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4081546035, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1732368526, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3754853997, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.1525816944, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3564469116, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.1070898496, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2488968735, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2559913317, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4735475859, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1491176925, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3356762625, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1029560218, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3188749059, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.01957055, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.1384604485, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0644970193, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.186070028, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2029291889, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4389559342, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3698141147, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.639725718, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2613937103, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4367528318, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1804913727, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1731635971, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3901529878, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5914927913, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3572973278, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5938598086, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.5798764085, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7315592264, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.1514039103, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3237295268, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2284852347, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4715534059, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4555430851, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5838068897, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3648138383, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5508265101, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.1210537445, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.1498007868, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3016723427, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5432451702, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4674098464, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6371051168, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4226160792, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5828781766, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0969128182, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.1598856966, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.9243310584, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.9496062774, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1231901756, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3813293435, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.123485244, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2904786796, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1903577848, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3976803688, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.1187002846, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0977192262, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2920573888, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3969902065, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3552315965, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3543141165, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3022575547, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4507970299, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1954384523, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4301384624, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.2315945921, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4615951366, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1942053406, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3370618041, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1098956591, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3237375736, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0977190156, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.2596010789, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2702173265, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3720094104, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.237030156, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.2253439878, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.127584973, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.203525371, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2429835228, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.3747255692, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.3117564668, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.1485542687, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2660580737, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2512653066, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.1847315745, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0928801768, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.2041289009, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3003447577, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5620618131, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3323813018, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5477871106, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3741170096, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6055449675, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0656114778, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2951585354, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1784558426, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4188092241, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4061568952, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6518699541, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4020514442, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6509497922, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3746270906, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6380910268, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1762453728, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.504671061, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3215185636, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5791349893, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4755325361, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6374842744, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4484533205, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6383931955, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5076686014, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6350257889, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0594898585, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3123751876, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2141312643, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4739909345, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6967460561, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7979056259, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6944088463, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.799967191, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.6361753758, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7575358001, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1982276029, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5051262946, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.437108046, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6307771712, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4747061103, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6158670237, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4259946463, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5962845373, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.450796161, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.58968348, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1267020789, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3303949481, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2112877425, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4211760008, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4359681894, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6137125901, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.0936807422, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.0897891511, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.133135544, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3009760623, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5353758025, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6788324818, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5166175693, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7101611424, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4400802497, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6301890816, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3287546082, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5572127362, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4120156572, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5926345507, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3041322992, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5787393223, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3270717706, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5734315882, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2939892383, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.551250948, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.1239738256, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1157189501, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3665222597, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5285470049, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6459593469, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4870922603, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6355645768, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5703676204, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6777266038, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1526837546, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4440631927, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3189881179, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5210805105, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4580357196, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5956642394, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3545686863, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.476664044, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3913025208, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5316948713, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1221432071, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0614680937, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2688589697, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4353295321, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2116626486, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4353914696, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1733425858, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3740639944, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0138194749, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1196538121, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0804447583, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.222199571, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3668184689, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5628733429, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2364213319, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4294193017, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3728320142, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5420862851, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2440519515, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4529255042, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3466721786, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4970077017, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3102460718, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4859132577, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3100832387, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.516688992, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1857158876, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4023978635, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0535329483, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2344463064, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0879680658, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3278294096, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5995988429, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7315867874, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3231992669, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5571408623, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3225927871, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5932287829, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2550011939, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.3917104658, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2093479658, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4547192309, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.173810894, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3434046187, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2754575825, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4306877567, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2072093311, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3223112401, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0787144038, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0783667145, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2005971699, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.232656371, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4141410184, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2330781491, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.411744251, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2594180752, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3896882194, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1274081046, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2480867414, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2218375714, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8787419089, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9422733087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6743295275, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7784500892, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5876945384, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7797337535, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.1694903428, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.2344927095, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4577470928, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5067481466, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5143785568, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5594267639, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4190039313, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4865765169, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.111882946, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3046427465, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2286082998, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5536486388, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7501188575, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.670001214, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8763862761, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.367551136, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7215481866, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.1464248931, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.2659597227, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5653615736, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.7346706701, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.7329410356, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.8651210439, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2809009542, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3474165677, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2513991761, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3090015909, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5181373057, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2632780943, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0358199485, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1729879444, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2071083533, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4145586808, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.55739114, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6451717402, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2717486771, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4160165374, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2628266816, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.4367566846, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3109559293, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5034602706, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2095138868, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4550960556, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3804736861, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6106280143, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5576133222, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2486316724, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1020482308, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2936250188, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2021077149, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4925372103, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.146872987, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5077161337, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2212877653, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4438446523, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1879777274, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.470758035, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2859826603, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5958071485, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1023261439, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3555649585, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1230470606, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2572628072, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0868083223, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2907268448, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1236236637, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1950558347, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3860511163, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3351322814, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2469263864, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3686991498, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.241258805, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4460812145, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1747094296, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3858452328, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7359287727, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.862745653, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3725527931, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.634798751, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5815699185, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8158797977, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.6556397462, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5244379347, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2251376916, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3221465444, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5354063184, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5302628362, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0661294119, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3908028983, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4988543287, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6529154911, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3532802306, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5839265502, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.45578637, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5808522375, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3026715858, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5333160005, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3878096207, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6180997641, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3695189488, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5604693026, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1633194828, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4068647645, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2487344417, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5459198725, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1932983181, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1032256991, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1630527, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4081053788, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2287219601, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4583168484, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1772765299, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4233964978, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1286198102, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2975484349, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.0811728811, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6549849942, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8107475687, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5970228994, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7589201367, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7389984312, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.860965653, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8725129388, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9495292424, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.5566206388, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.7291490644, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.200520325, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.502257785, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1507001023, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.411695047, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2036163743, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1427349738, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3712417022, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.8253498773, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8529564805, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.8253498773, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.8529564805, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1693721376, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4871671286, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3164918395, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5679185954, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.287558382, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5034550585, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.5556398916, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.6398624685, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1424648973, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1304360687, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3571380358, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4336378543, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6642129647, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3424682602, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6344653276, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.313708352, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5881287324, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1012242353, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2343905832, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5131983151, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7616672596, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5862368043, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8099138444, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3563810735, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6446808198, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.1425546239, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.1995321605, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5875233938, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3754544247, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6063264858, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3640515625, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.632300052, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1596578751, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4786324898, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.1182124575, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0524702775, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3144455844, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4154571861, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7057846334, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3871258497, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6277405418, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2734805448, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6058485412, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.1956020486, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1254765121, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4561162618, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1981831978, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4925844813, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1605573917, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3888104634, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3254221548, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4089268375, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0738663975, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.1467339554, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2822535302, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3978792053, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2833608714, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3843403302, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.280776323, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3806484184, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1954287623, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.1725414554, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3590404023, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6708874697, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3022215252, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5984950448, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3541766522, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6033476632, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.1865188034, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.2953787279, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.307587447, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5072843332, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2248797177, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4257079532, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3934004457, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0658487241, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2573054579, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2812488198, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5745890808, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4486727666, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7186781719, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3832544339, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7040735112, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.1948126077, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1532614042, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4601298544, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.9243310584, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.9496062774, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2245659443, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4289339929, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1389213326, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3633674986, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3059402413, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.438474323, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2489644619, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.2435440937, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5037410821, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7255032262, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4641860438, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.66667529, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.5063299741, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7202586379, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4001941056, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6211566792, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2802116159, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5763419735, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1063732349, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4420365244, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3181038313, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1126934057, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4239791118, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.2365546515, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.3097227784, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4675640781, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6438637214, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.4456604653, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6390040126, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5844803971, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7020483558, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.2745094164, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5404614242, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.409202773, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6365177202, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3757600613, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5484260908, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3567235237, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4687499658, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.2416470723, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.3926015765, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2467742829, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0794635782, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2542451279, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.5030966277, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.680466091, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4188516767, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5968056122, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.407638044, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5848678922, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.080256233, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3168464213, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1870854785, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4608359318, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4012403951, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5502161218, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3987258775, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5864219777, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3949227611, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5964495195, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2844665636, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1347404365, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4568041488, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6653973165, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.424340513, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5733777341, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4060507215, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5979247179, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1796268882, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3916632915, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2442590105, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4434063545, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4390212048, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6475219955, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3931152868, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5586707455, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4376048462, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6003954854, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1343765164, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3843406249, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.292024371, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5503274886, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2356067382, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4505712028, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.186411773, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.41746732, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2081161785, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3954935034, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2643902661, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0796382254, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3268028459, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3244721162, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5077210804, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2306619464, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4298903519, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2724173676, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4531095939, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0839296371, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2714896999, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0845238055, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2918197176, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4459565225, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6647029995, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0886800253, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2568222133, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0955980419, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2940646914, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1612831386, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3440984871, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1380046097, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3181131812, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.440035505, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5988144881, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4391343776, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5999224498, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.217361275, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4284103162, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0218404908, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.115627302, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1951778697, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4646005812, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.5183632566, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.6705567849, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3129763613, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4993198489, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2892316007, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4768839853, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0965700538, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3135588343, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2101630852, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4169963033, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1512450377, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.487449587, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4499802275, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0794429423, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4267439859, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0595176787, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3079747172, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1406514456, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.412860687, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1506678365, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.448328585, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3055500359, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1247960547, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4551443068, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1646901432, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2713884746, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1507754057, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4306402152, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3089070144, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4353286657, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.067595334, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3250818462, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0619430504, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3328924831, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.096979215, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4707628611, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4327654737, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1019390433, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4783734156, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3322570265, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3651320523, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4543944787, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4131432458, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3947542499, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2390539104, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0517867867, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3432684678, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1551082905, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4231895808, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1862321334, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5228172023, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1270147783, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4033267379, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.206807738, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3413997135, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0616943831, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3642077907, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3673121627, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0359194689, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3024428691, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1897072482, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.336862198, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1651856335, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4631382298, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4425672931, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0729309927, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3509917881, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1214753612, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3675198977, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.107003545, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4848675989, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1616527688, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5185128505, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1144231004, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4385633678, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0493732122, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3372146907, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3955645311, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3410035629, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6673519559, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2215037081, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6073932835, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0103127151, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0616562268, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1376687923, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4079222812, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1736846621, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4322849387, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4561373145, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6655742412, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3664140352, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6156875253, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3510416809, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5257097928, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1402342404, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2959236501, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1990499617, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3534966827, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.5621669807, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7520069792, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4383729772, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6543801046, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3575978349, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6192927432, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2212146899, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4131481258, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2469537261, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4961446999, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3562902191, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6699423353, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2672991325, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.624013032, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0922349333, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3046590495, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0847400568, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3322680661, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3525333892, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6286864313, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2271273793, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5721925717, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0049961354, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.030698403, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2297285043, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.116557507, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.313741991, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3572815261, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6216765378, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1874538525, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4709873292, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4162014036, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.592070527, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.074018222, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2244203451, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1451596295, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3240520467, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3572815261, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6309384943, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2467659506, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5348071146, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2571940113, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4967837111, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1751807734, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1884470229, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5842771441, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7733784586, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5409623041, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7430127527, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.6403647618, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.8633425886, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.5383002028, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.8276473976, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.9336510696, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.958650753, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4531946634, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7044338154, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3053838501, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.614283171, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0054491617, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0261580293, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1379454665, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3950967796, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1801665025, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4094466587, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4399465474, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5758276579, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3978536655, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5063642414, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2329989882, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3980073363, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1510957102, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2485805445, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0686555147, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2912548503, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1207269216, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3162144634, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1677739164, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2565892972, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1307118752, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2566872958, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0783884461, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1974566447, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2263565415, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7056438934, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.7315339098, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.8175179632, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4390960898, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5382986509, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2255844967, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1809658013, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7056438934, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3571150501, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4963585573, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3676041144, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.419852101, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1566391541, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2725914793, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2201844821, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3372212279, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2252369759, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3876727889, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2252369759, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3626015527, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1240959712, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2344817695, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1075467277, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2565582172, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.1620970608, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.6230832294, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.70254087, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.458703244, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5232464635, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4578226095, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5429809487, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.28273991, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2704657013, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3436358974, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4516759457, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5169677928, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4516759457, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5169677928, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3126851492, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.40158087, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2521432424, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.317135213, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.053395131, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1432217833, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4516759457, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5135242648, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2403479326, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3290984948, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2809128259, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3881602965, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0703293477, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1159507116, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.23225723, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.6242817472, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7056438934, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3978610451, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4980599039, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1692569703, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3070346644, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.197875065, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1180286135, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2474367452, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.445513857, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4044449962, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4418719444, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4034042753, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4146768169, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4615425016, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7427658454, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6057091247, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6546258442, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1534697291, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.515565124, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4384930066, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4425973012, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4483037848, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4483037848, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5082803455, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3981852532, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3830425593, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3981852532, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3835863005, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2686778755, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3113878808, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6728506998, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6417603075, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6546258442, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1667955161, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5795544193, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5064818122, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.5303624596, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7835371348, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4699822121, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4699822121, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2540637884, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.27584557, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5310543174, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4216875815, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4833500875, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3099391219, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3804480402, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2014941616, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5931139543, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2724974523, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6760199025, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5335249134, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.220501041, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2125763546, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5141209056, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5079329665, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5141209056, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5773063191, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5774060819, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.328251853, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6453010665, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3294164636, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.7004719342, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2087037147, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5493435887, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2311466382, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5766355254, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0629710366, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.383611695, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6888365053, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8656273481, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5091224919, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7829685247, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2597064971, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6087618281, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1513630224, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3848617015, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0909379867, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4398085115, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.6912804408, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.8416888527, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.8522456714, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.9096914044, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4085639059, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6786065713, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2112648086, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5603202945, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7196315267, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8835331637, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.546149954, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7954823724, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4451075766, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.6955301379, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4454357881, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7513336774, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.6383964846, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.815515317, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.357102986, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6375235254, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3453786558, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6205376126, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1910722296, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5057577708, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3403336518, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5950884702, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7046532915, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4145247088, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7104231206, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2537184041, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1619557013, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4640690459, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3917444023, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6762795188, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3124325728, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.6722343255, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4523474723, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7277271274, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1140842452, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3629959771, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1038988938, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3748538161, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.6004981752, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7274351792, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.637202263, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7346216973, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4523034717, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.6737381483, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.27444079, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2099268349, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.310088227, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3851341467, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.700571373, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.4222184785, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6656008733, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.6173766801, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.8573900401, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5609383777, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7973683101, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5040253502, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.7254592658, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.228768444, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3953738393, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5370988256, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.213387489, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.6034116936, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4359493825, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7673284019, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5582775803, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4135171, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.7555530032, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4206173028, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.5967384019, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8544348081, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6507561417, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8215788698, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6507561417, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8215788698, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.6507561417, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.8215788698, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7246227738, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.428494509, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7211812033, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1328002272, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4983488136, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.429848247, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7369844405, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4899456142, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.8020845126, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1602417931, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2524720088, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2962789157, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.608714571, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2500966497, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3829228358, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3619308441, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0514276487, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.3763953327, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4812700338, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7668482136, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3258816485, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.7240768473, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2622470152, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4590143917, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1553586215, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3726937394, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0853874742, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2903017692, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0210266314, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.1004122321, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0605813979, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2708928603, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2556422229, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4291463251, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1520832336, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3357817921, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0555078283, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3017380756, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0145373511, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1137647864, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0125133478, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1667129052, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2535787382, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.457896662, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.136763833, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3930270089, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0626565443, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3103961933, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1382368241, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.059936325, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2480370686, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2487984732, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4808459302, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1119004718, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3207756555, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1770079985, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4251640447, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.1065437287, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0506326413, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2063157538, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2706589649, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4576310781, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1801847412, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3788121735, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1942705885, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.393160027, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0148442215, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0951738246, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0505279112, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.210149811, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2134127737, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3993267196, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1370723839, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4184465202, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2082125697, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3626252612, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.098281743, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0590176545, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.2239028811, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2040584432, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3869788846, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1422383967, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3372144194, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0726142466, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3123933214, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0744097162, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0450397011, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2455593932, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2249382218, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.435607309, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1747178289, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.355405822, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1089629302, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.311102417, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0175405257, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0987376214, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1892957231, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2488464414, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4890540555, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1726437399, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3735954911, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1276861358, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3395298581, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1023492205, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2762431573, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3081587575, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4611100423, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.431864811, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5525904593, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.5892468541, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.6366953113, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.1463211076, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.1480582994, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3931991983, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5762809938, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.4220833561, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.5979768974, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.5350934112, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6604901008, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1578662314, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1129182824, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.2586362605, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5016232721, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.3098590148, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5482494608, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.303164724, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4588723411, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1398026485, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.1723211496, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3424885276, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5683099371, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4908217883, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.584120706, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.3132694642, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4732494916, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.1128669107, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.1739698084, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3440134693, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.549589855, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.6206693056, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7568146072, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.6827816739, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.7764983343, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0842567347, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.1973749021, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4194435452, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6003681414, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.5801271254, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7044697964, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.4655582025, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6503339718, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1417880654, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1431664216, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2607117486, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4104518639, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.272451774, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3994749502, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.267803949, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4240591651, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1524375046, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1644772457, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3128076344, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5182772142, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.4149070931, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5200674066, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1787993588, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4225521949, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1554990916, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.1243889412, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2329218076, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4655700551, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4862041607, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.566690507, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4578146014, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.564811613, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1893317245, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1901591937, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3814061362, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2297430099, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4387133834, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.3067435429, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.291522149, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.2957480013, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1579537051, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.430134848, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.304476733, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.2004324583, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1086582496, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.1806767196, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3693695134, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1176345357, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2925508456, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3073616767, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.2670896193, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1837134362, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4297917347, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3486134996, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1631849581, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.326150029, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3084506163, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2627460647, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4328065186, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2638548135, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3672497643, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.3108512602, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6363359373, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4323876064, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.8055359641, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.886602904, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.9278293769, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2825389301, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.5344527157, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.212432413, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.365696558, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3215134657, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1014090185, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.1234840549, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.2692774259, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.4179412848, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1560665245, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2770325989, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.2996949022, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1001372506, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.1625690111, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.2825389301, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4976525037, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1270642199, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2440075668, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.103339841, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.286598559, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1043436098, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2304702266, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0924171382, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2574240007, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2464198596, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.3656201333, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.125778296, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1786140394, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1987361101, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.1160604142, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1732519609, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.2589707148, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3894763383, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6458478419, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.37091868, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6391351243, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4154129291, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6551586606, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2632215534, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5349093488, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3691596262, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6148019953, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4932917922, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7250812194, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5425782644, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6842899817, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5050320102, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6767890223, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.1158794317, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0795969907, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4508254633, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4358580014, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7739155888, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3725685851, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6793633737, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2988693281, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6737618245, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1157312031, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5372702899, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1613918211, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.595721186, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5045866834, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7432853994, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4756695859, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7418637036, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4334817334, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7171116207, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2050725622, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5426869695, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2896892505, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5930620043, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3318040043, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5104370577, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3507080155, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.530639559, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3103314868, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4793429149, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1691736358, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3548723954, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2576216193, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.419004884, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2855538302, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5913739539, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2647341117, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.517820911, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2344231337, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5275347524, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0973747752, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2315623244, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0968875821, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3837084677, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2561427664, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.459258318, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2375796998, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4505198894, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2171548434, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4709185497, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0911030624, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3176666445, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.075181772, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3276426117, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2400005785, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6324601535, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0809614605, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4449910499, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1728300232, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5002768449, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2749055998, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3726637878, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4409737058, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7155893246, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5502972491, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7372824427, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5065640727, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7393595983, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2029140971, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4486025295, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.29273037, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6150714044, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5733962624, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7116531771, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4271477483, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6354195574, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4625123206, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6509807296, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.237281279, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4382445666, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2648541006, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5024165837, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5611598962, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7539020133, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3457318869, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6817029798, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3405167442, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6563835876, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0606126075, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4091252276, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3728937116, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6577808114, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2974073493, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5830927064, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3250777038, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6245400082, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0771850833, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4162271381, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2551081867, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5871389811, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6696221279, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7575888913, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6413060773, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7264963132, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5479209488, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6582463921, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3321412317, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5747428897, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4072350447, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6300067107, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2863916568, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4033306935, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3216042915, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4309767197, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3148906208, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.426492351, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0846356642, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1473307203, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1552796518, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3330096252, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1243048054, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4188895923, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1446970285, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4460940289, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0871307032, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4165249375, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.130542673, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2820267618, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4261391764, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6170683508, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3933372499, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5497639692, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3933914801, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.533822576, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0642986259, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2214848996, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2211171724, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5855191906, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1468792836, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4961191884, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1859723721, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5322764543, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3246899311, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3100498117, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3345749807, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4948403657, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3755133068, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5382122955, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4440522294, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6063305672, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1885744065, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.401688874, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3706284524, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4903054058, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1574644094, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2757258739, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3379740275, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5024415462, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2177684253, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4326933291, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1653718418, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4021366715, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2866736814, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.511205425, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4190701615, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5756418081, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3875233761, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5087692893, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3545355532, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4920924348, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.016481562, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.1042780617, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3216581105, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4367200228, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.599582244, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.744661685, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5624634855, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7208214628, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5046747712, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6485787221, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4015453155, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5765093529, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3716332024, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5997893915, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5417389235, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.642433719, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2270898641, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4268311768, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3111562562, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4587576527, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4034278346, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4659288646, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1651403714, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4038726312, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4012715809, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5569332816, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2173289398, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3748471244, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3108464845, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4100147538, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1663639341, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1021604171, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2824944882, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3435591481, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.496882135, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1877972313, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4167571671, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.248567001, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4381394216, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.048591157, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2382129689, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0495180896, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1886035546, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2245209743, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4694055398, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1208502583, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3124167475, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1066160676, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.294016662, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.068580961, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1852040732, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.097526568, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1646244729, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.5842771441, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7733784586, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.5409623041, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7430127527, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.6403647618, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8633425886, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.5383002028, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.8276473976, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.583568612, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6699263395, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4504787314, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6272454245, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4521483403, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6093451568, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3492781465, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4383491029, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2831085292, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4576463253, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3448578743, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4669543574, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4500973764, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4383397526, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1765846538, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.3452556465, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.1411119238, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.1107656147, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5319381818, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7292642796, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.434286966, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2405939782, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2482362812, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6025268807, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7756526381, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5775400217, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.775981567, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3420788649, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7981885823, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.2221602357, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.2927793623, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6187129112, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.783347898, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.446338868, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7206547449, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3132060554, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6780959222, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.2248477066, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.1638003754, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3510762437, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4001039485, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2538209236, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3065410614, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2636758063, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3333208049, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.1029834289, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0642319091, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.8413544004, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.9005264466, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.6978499535, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.7680111715, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.8037775081, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.8813855605, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2310325762, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3824279168, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2018356447, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3979134817, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.5556495621, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5724214108, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.7228204707, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.7113746849, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3676041144, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4694590303, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2255489037, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.33145819, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2087266913, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3323623292, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3619174049, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4683222931, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1966781229, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4099446715, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1966781229, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4069323584, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2428367901, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.280095132, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5096772803, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6511024508, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5096772803, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.642751012, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2978735711, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6380558649, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1174603506, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.114788761, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5322520826, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7271316675, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3535749731, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5088037626, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3622547792, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4949023339, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.353991485, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1709269924, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4589403856, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5675311466, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7445312763, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4275362732, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6105526571, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.45617777, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6731126316, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2517782992, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2779306146, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5089175115, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7277035121, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4183007446, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6688763364, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3892727054, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6989587493, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4188661445, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5586915231, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.287558382, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4932995367, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.318581008, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4738374872, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3321678143, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4723826766, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1173952179, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4256923177, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2453318866, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.494452768, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3619174049, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.545884109, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.6666467303, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6471929786, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2428791292, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.241333176, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2338135382, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3427235649, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4081747281, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3774510451, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1318131343, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5386041399, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.232250537, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1120375434, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4030209467, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1432450176, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3826571896, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3318900486, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1081559373, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3191612091, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2792531022, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.148088719, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1677739164, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4046828129, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1627690506, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3948411498, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1117554475, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3627168098, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.233665254, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.222018981, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.341191474, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5117673951, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3725748409, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5400450497, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2288355035, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5836260855, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2671273299, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.1381779039, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3144154095, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.6769906826, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.8083906073, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1739898488, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5216901259, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.189602679, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5147057623, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5199744507, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3883058592, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6037425262, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5106109398, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7688046995, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.5106109398, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7688046995, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3952355242, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.7537413929, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.1926916667, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5214226503, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.5088645485, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8116199676, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4075584824, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7803434177, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.33828653, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7321312284, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.6535194995, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8909391457, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3055117238, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6522327841, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.657716091, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7714634548, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.8151678596, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8873630456, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5114981214, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6207619434, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4962806188, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6985190396, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6153267327, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7220474571, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5518218099, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2479866826, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2635199569, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5606184355, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.368224131, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5606184355, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2765950321, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.42374983, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2615311775, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5017688443, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4369322371, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3468012291, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1501349739, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1754918305, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1600872496, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3565190644, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3088522099, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2666066054, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.483406879, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2558006851, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1867041258, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3079852791, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6801949008, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3719278006, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6892896282, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3075261697, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6821513697, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3036431152, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2601611411, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4572935209, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.453655627, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4475397629, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4422069076, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4847458184, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4165767637, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5728095918, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4360038791, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5748585174, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.8318180062, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.8641903026, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3140382294, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5631437829, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.7498810286, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7726337965, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3723091903, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6028889976, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2103407319, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5878781611, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3299895473, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6337904872, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2685563379, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1633194828, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3775551867, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3550420051, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5693079918, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4596307297, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3550420051, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5693079918, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3346449427, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5058892672, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1799107865, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5159811845, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3623885503, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6212681812, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7886867104, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4601221425, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6704634783, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.6617520153, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.7140739801, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.544786716, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6078540955, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4938015542, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5654925887, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.6068655708, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5901094922, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4715479868, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4598255389, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4772349067, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6979552346, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2484529356, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5252866054, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1785403228, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4266196503, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1723303147, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2684009711, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.6169034543, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6942951271, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4706365972, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5660330383, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3787865613, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5426085574, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2175881063, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.320023968, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.5874688341, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7953606598, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.4477218071, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7608597891, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.4376250019, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7561867704, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1656558577, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3855427495, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1143480002, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.271581121, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6102624547, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7455382911, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.6102624547, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7455382911, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5129914365, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.67190581, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5815025407, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7086281431, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1755427274, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5197819745, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7056405694, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5272145166, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6984559479, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5424690782, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7222670487, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1226967111, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.2848321926, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2440186706, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4385803078, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2721148714, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5914641898, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2686079606, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5123463581, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.2486866475, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5361155849, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0477462923, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0650846084, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.312718884, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4295114388, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6901398329, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4548004572, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7465606836, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3416682036, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5929379454, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.243147273, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2203442568, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4361275433, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4026021376, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.665169776, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5474706069, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.804473729, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5035012366, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7089119315, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.2574911931, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1435358442, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.381181164, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2079088715, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3457623435, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1945816843, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3334872222, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1561403285, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2994402838, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.034321633, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0237913545, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4276676633, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6775603101, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.4028188935, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6269035793, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2176252352, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5559852813, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1549577496, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1007849149, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2126034365, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.550826234, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2599744756, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5252318414, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2692827691, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5550492924, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1134563932, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0774386122, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2515823082, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3400426546, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5690760098, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2783592722, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.528002244, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2796257611, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.525801232, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0421968801, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0555746239, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.2524744935, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.4416699547, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6991837934, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3681388127, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6663751332, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2922076174, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5600839481, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.0256032267, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3027682064, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.264926859, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5168400513, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5198707242, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7322317271, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4774025962, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6612122474, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.1648348642, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.1555238526, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.4229385542, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6398920453, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1943067625, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5171544283, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1986382491, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5627974274, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.1968712517, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2651822046, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.371586245, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6081420532, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2302096976, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5280846549, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2791742968, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5541020626, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.1500779341, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1958598295, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.4310121274, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4256512186, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7373776069, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6142322395, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.8267772572, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4622377024, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7573830179, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.2035623697, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0986563752, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.3583887259, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2704817076, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4345032238, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.196922159, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4873983653, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3954512194, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4398570288, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.128166123, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3086389171, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2796471531, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3532162042, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2852994464, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3535144994, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1967705363, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3013882733, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0934005227, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1851444607, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2398099817, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3657849257, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3799401898, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1910518236, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.401101831, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1757942889, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1830641485, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2424855109, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5394338001, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.2871244623, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5130086721, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3357306484, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.6709968513, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.1522614513, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.1924681542, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3603212181, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7061680908, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2242667364, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4850454299, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.357102986, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6503106787, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.139477842, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3768843305, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5038203949, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7121763619, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2391817842, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5705865378, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3245246551, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5884909164, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2080764279, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5713091082, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.1909296489, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5434160556, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3330192772, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.6227994573, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.171079793, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.5862164742, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1321324457, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4887630789, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.2663395431, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3305068265, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3931991983, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6611329021, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2481723264, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5569707664, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3245592827, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5310900771, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5014855896, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.2031552942, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5421921966, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4574614318, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5874857498, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3979308132, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5730947029, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3386685756, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5469381479, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.1342798256, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4444394912, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.286157866, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.5609620177, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3108512602, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.6363359373, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4323876064, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.8055359641, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.886602904, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.9278293769, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3189158022, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5488981549, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.101560137, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.4127375186, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.1334305541, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.3549510356, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.1313899161, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.2809569646, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4169434378, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.309072299, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.108561755, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3852135209, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.2965802809, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3024415044, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1977072463, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5083591787, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1307201098, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.448486347, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1115815139, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4299586248, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3110937359, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.2201061386, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5270846788, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.137942361, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4696516496, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3304476399, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.5342728014, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.4878555885, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3397655986, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":0 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":8 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-2.0-flash-001", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":1.0, - "sentence_nr":9 - }, - { - "model":"gryphe\/mythomax-l2-13b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"microsoft\/wizardlm-2-8x22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.3966517116, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6126466913, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3475853602, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.541459987, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.1822361224, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3997108494, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2720948138, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4835271066, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.4178188084, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5837393615, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3695995811, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5711056847, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0000000919, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0431986714, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.1853464136, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4093242023, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0000000919, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0362915397, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.2844302564, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.5121261928, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1745431492, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4088014664, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3412793714, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5566337161, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3504957829, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5420312731, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0969972045, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.4832107456, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2419830598, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1320718304, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.4415333367, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1398771832, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.3965032466, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4033978306, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1228715408, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4146285797, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0736272693, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.4084116518, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.2131242166, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.4821428819, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.434159348, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0880200868, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3115909203, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1521784384, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.4592008131, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.220619756, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4664938153, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0795221213, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3724723155, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1198269585, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.4593235483, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1814484996, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.495978943, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1521582017, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3251295716, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.2430376937, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5225794823, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.151865293, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.3218574497, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1546331303, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3246079335, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.2646434905, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.2625161534, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4838334557, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.1642160313, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.3214389849, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1931815248, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.4763864029, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.6070689912, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.7305039391, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3326486375, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5883890967, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1821686983, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.302972981, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.1702602472, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.3050713984, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1013606811, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2880515365, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2679974277, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5619147668, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.1210366914, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.3122915915, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1863706774, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.2898682628, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1909881176, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4357592029, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.2512201351, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3613480005, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.6256538562, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.6943310522, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2636438825, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5375272791, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.1406853565, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2342066897, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.388441382, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.4874443082, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0674159976, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.1065354986, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.264926859, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4024071085, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.357914128, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4554915707, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1714562241, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.2743526917, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.3730786951, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.4157762304, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.6290393497, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.1536220823, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.5798536462, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.33598634, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.3519556829, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.4784253622, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2680165156, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.611921685, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.435050222, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.2460137258, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6869474337, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4030945868, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.3081599032, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.4148296419, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.4050845737, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2369305576, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6474126202, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5384586523, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1718152967, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5257017186, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.611895563, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":1.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.4451075766, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.7334918117, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.4818114945, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7675828789, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1990581597, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6133817758, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.2704091954, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6207272323, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.5465526716, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.8012679277, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.3335910323, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.7011023633, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.3207873973, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.5817366082, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3485799123, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6090575372, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2810335396, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.605156453, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6642691959, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.691790174, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.8479928839, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.546149954, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7954823724, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.4194685158, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.6582292681, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.546149954, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.7954823724, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.3857587082, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7029566282, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.1753767087, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5886202682, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.1673872929, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.4506667273, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.7511573913, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.9453473544, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.1946452196, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.5838790967, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.5014756678, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.7958858212, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.6509517796, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.6564314769, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3236579503, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5875876275, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.2319821043, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.6307116012, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.3226386416, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.6824395077, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4184379522, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.6995568307, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.2404786079, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.5819897904, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.373921491, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.6536082905, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5512324462, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.4881010345, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.7317734492, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.2719326877, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.5963825615, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.2445665611, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.6532234058, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.447872232, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.7968980207, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.3581864018, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.7236278104, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.3167161501, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.67827349, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.1301048539, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.3149300382, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1648468485, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3917558573, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1130729983, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.3688031545, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0004488418, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.089305888, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0532360836, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.2211046787, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.1807114774, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.3631407688, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.3378903234, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.5556453958, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.4021850735, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.5369243982, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.0262909263, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.4630917652, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.5360107471, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.3957264202, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.4958499678, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.3168900267, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4217762086, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.4372110759, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.5492872921, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.1328643776, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.3043418817, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.1773973124, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.3761627808, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.4359682535, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.5243661809, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.412806204, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.5196214432, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.4244459417, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5176629059, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.0826435439, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.2093360771, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"bleu", - "score":0.1478824915, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_from", - "metric":"chrf", - "score":0.3273983783, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_from", - "metric":"chrf", - "score":0.0231778896, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"bleu", - "score":0.1255213133, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_from", - "metric":"chrf", - "score":0.4194221711, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"bleu", - "score":0.1004077623, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_from", - "metric":"chrf", - "score":0.2293820934, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_from", - "metric":"chrf", - "score":0.0809100044, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5670546248, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7791227967, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3457410059, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3692590781, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.8590406918, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8985766779, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2697790305, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6173213845, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.6649820533, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7856446622, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.3073041537, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.514597811, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.0238287164, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.2644118551, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.106319927, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.3651947098, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.508272955, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.7319355475, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3825696797, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7134549338, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0311091903, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5402189689, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.7688675864, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.4659704405, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.7247463228, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.360581731, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3933076922, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2234503775, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5073212179, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.5200746238, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7143812917, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5723092813, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7320823035, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1411183069, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4499767499, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6420242161, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7826629559, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4070089443, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.6333591104, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5192292045, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6435810884, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.3524295891, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5231782615, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3329929683, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5456708438, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3686682677, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6614268294, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.5774196213, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7322219196, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.4009086918, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.4217036033, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.4099353599, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5371786113, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1357102688, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4956509438, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.5145070028, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6293403102, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.726000182, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8743307224, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.596698202, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6815230707, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.5725251534, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.7101534059, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1820705281, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3864538215, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.6095027193, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.7656473896, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.3647817968, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5699896912, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3445364014, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.632120037, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.3090310267, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.569470872, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.529550285, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.7216225504, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6527019935, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7749889271, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0188098832, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.1599510106, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3255999378, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5232900687, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":1.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.8107492451, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.9000327478, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.0748774416, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.6885326215, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.8328652216, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.2052212051, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5594940673, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3907228334, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.6344060552, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4815092082, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5613602982, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4276082873, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6536913951, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.4298810543, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4705032487, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.8595328139, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.9098840135, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.3022867927, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4457424291, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4761839369, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3034491157, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6798106213, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.4466679874, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7283431044, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.2217572794, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.3958828105, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.3965384288, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5702892011, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3187271473, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.3811308672, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.4687776643, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.4517409273, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.3734470176, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3820562307, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.5488313413, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.2308824748, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.4447723693, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2862085038, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.3823890695, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.2756333028, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.3993831713, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1860501646, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4434360695, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1567750617, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4928652815, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.1282491921, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.2524884798, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.4599996071, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6267974727, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3200938205, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6393945963, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3782727845, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6480161649, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.2031205438, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.3026286473, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4799233253, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.3451314769, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.1790037085, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.2910454983, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3568630983, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2330781491, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.6295171818, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4819511629, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.7170281746, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3500851741, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5415801306, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4093184131, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.5715958346, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.8330787011, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.9482515348, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1475758119, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4819243515, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3464821641, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.5903354473, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0473282084, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.4899417818, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3996617914, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.4470161785, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.8350256155, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6848075777, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.799139523, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.1788973419, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.406447761, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1310249598, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.3785744421, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.407135992, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.7697196337, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2858565969, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.5971070986, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.8874294966, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.3117732724, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.3089525776, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.0088652482, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.3124325728, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6024486188, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.1705746719, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4261710812, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.7181417753, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.8029162546, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.1782921966, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.4892059806, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.5894159589, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.7585081366, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2672825521, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5947619308, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1560424227, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.4948804416, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1625677471, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5039740897, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.6486932415, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.7887116805, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.6651557977, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.7107545146, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.3678169128, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.6159870046, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2572396203, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.6032951031, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.231344208, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5732050784, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2519262872, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.063462015, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.127127955, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.0112017261, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.256949594, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.3776963602, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.5392238315, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.4112296795, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.6173246841, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.304228848, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.6437766898, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.2489022408, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.5809139399, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.5366186003, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.6886178182, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.0977620571, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3509809637, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.2329143346, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.5597013067, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.2877266359, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.5452950559, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.2585518999, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.3445778904, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.663098603, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"chrf", - "score":0.1941642461, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.3049195653, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.5730973226, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.3715079739, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.2377842957, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.4090777522, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.4478039778, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.702731981, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.1587667047, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.4627609227, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.4467367036, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.5702658069, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2910873659, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5097137744, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.1163327084, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3968305235, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3818878183, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.6843771196, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.3528360454, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.6592215569, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.3480877155, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.5371325399, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.1185099796, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.4011805746, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.245369104, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.5145398706, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3538049407, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6079597827, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", + "model":"openai\/gpt-4o-mini", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"bleu", - "score":0.2931266115, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"translation_to", - "metric":"chrf", - "score":0.4957483698, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"bleu", - "score":0.4748202049, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"translation_to", - "metric":"chrf", - "score":0.6389166442, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"bleu", - "score":0.1760482971, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"translation_to", - "metric":"chrf", - "score":0.3966935539, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ur", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"bleu", - "score":0.3624420094, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"translation_to", - "metric":"chrf", - "score":0.5744562766, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"bleu", - "score":0.3885590147, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"translation_to", - "metric":"chrf", - "score":0.6291913508, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"bleu", - "score":0.353938227, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.4709266199, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"bleu", - "score":0.2808746698, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"translation_to", - "metric":"chrf", - "score":0.5644076652, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"bleu", - "score":0.112642965, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"translation_to", - "metric":"chrf", - "score":0.3755118765, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.1869886574, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"translation_to", - "metric":"chrf", - "score":0.5064678234, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"bleu", - "score":0.2212749443, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"translation_to", - "metric":"chrf", - "score":0.4521129355, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"bleu", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"mr", - "task":"translation_to", - "metric":"chrf", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"bleu", - "score":0.1918957007, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"jv", - "task":"translation_to", - "metric":"chrf", - "score":0.4759856856, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3113701869, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.55946099, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":0 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":1 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":2 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":3 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":4 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":5 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":6 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":7 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":8 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 - }, - { - "model":"qwen\/qwen3-235b-a22b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.0, - "sentence_nr":9 + "score":0.3184321553 } ] \ No newline at end of file