| [ | |
| { | |
| "language_name": "English", | |
| "bcp_47": "en", | |
| "speakers": 1636485840, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.4351349353198866, | |
| "chrf": 54.9504915580248 | |
| } | |
| ], | |
| "bleu": 0.4351349353198866, | |
| "chrf": 54.9504915580248, | |
| "commonvoice_hours": 2649.0, | |
| "commonvoice_locale": "en", | |
| "population": { | |
| "AC": 931, | |
| "AE": 4996040, | |
| "AG": 84434, | |
| "AI": 17186, | |
| "AQ": 300, | |
| "AR": 3183537, | |
| "AS": 47954, | |
| "AT": 6467398, | |
| "AU": 24447840, | |
| "AW": 2986, | |
| "BA": 1726016, | |
| "BB": 294560, | |
| "BD": 29277180, | |
| "BE": 6915213, | |
| "BG": 1741725, | |
| "BI": 6289, | |
| "BM": 66010, | |
| "BN": 7896, | |
| "BR": 16937280, | |
| "BS": 337721, | |
| "BT": 86055, | |
| "BV": 1, | |
| "BW": 1876956, | |
| "BZ": 399598, | |
| "CA": 32416926, | |
| "CC": 101, | |
| "CH": 5126434, | |
| "CK": 8574, | |
| "CL": 1727746, | |
| "CM": 10543100, | |
| "CN": 62731, | |
| "CP": 1, | |
| "CQ": 482, | |
| "CX": 1389, | |
| "CY": 924676, | |
| "CZ": 2889675, | |
| "DE": 51302208, | |
| "DG": 495, | |
| "DK": 5047693, | |
| "DM": 69788, | |
| "DO": 7980, | |
| "DZ": 3008103, | |
| "EE": 614310, | |
| "EG": 36443400, | |
| "ER": 3587908, | |
| "ES": 12003792, | |
| "ET": 46488590, | |
| "FI": 3900169, | |
| "FJ": 879816, | |
| "FK": 2814, | |
| "FM": 58389, | |
| "FR": 26460798, | |
| "GB": 64445878, | |
| "GD": 108570, | |
| "GG": 67052, | |
| "GH": 6161442, | |
| "GI": 23665, | |
| "GM": 869600, | |
| "GR": 5409621, | |
| "GS": 20, | |
| "GU": 153321, | |
| "GY": 750204, | |
| "HK": 3697454, | |
| "HM": 1, | |
| "HN": 40635, | |
| "HR": 2071598, | |
| "HU": 1954366, | |
| "IE": 5073039, | |
| "IL": 7374158, | |
| "IM": 90499, | |
| "IN": 251957100, | |
| "IO": 3500, | |
| "IQ": 13605445, | |
| "IT": 21216918, | |
| "JE": 96019, | |
| "JM": 2752399, | |
| "JO": 4869270, | |
| "KE": 10170301, | |
| "KI": 111796, | |
| "KN": 52745, | |
| "KY": 60705, | |
| "KZ": 2863785, | |
| "LB": 2187844, | |
| "LC": 149838, | |
| "LK": 2288920, | |
| "LR": 4210839, | |
| "LS": 531719, | |
| "LT": 1037955, | |
| "LU": 351893, | |
| "LV": 865366, | |
| "MA": 4978638, | |
| "MG": 4852026, | |
| "MH": 72463, | |
| "MO": 14133, | |
| "MP": 49890, | |
| "MS": 3492, | |
| "MT": 402395, | |
| "MU": 993146, | |
| "MV": 293928, | |
| "MW": 13353858, | |
| "MX": 16724500, | |
| "MY": 6856941, | |
| "NA": 184105, | |
| "NF": 1678, | |
| "NG": 113434840, | |
| "NL": 15552360, | |
| "NP": 909837, | |
| "NR": 9350, | |
| "NU": 1120, | |
| "NZ": 4826970, | |
| "PA": 545171, | |
| "PG": 3629730, | |
| "PH": 69875840, | |
| "PK": 116750500, | |
| "PL": 12633159, | |
| "PM": 187, | |
| "PN": 46, | |
| "PR": 1562644, | |
| "PT": 2781729, | |
| "PW": 1887, | |
| "RO": 6603899, | |
| "RW": 1906860, | |
| "SB": 685097, | |
| "SC": 36473, | |
| "SD": 27792576, | |
| "SE": 8774150, | |
| "SG": 5774984, | |
| "SH": 5425, | |
| "SI": 1240581, | |
| "SK": 1414556, | |
| "SL": 2318726, | |
| "SS": 2851524, | |
| "SX": 29816, | |
| "SZ": 883584, | |
| "TA": 272, | |
| "TC": 54807, | |
| "TH": 18623898, | |
| "TK": 1285, | |
| "TO": 29707, | |
| "TR": 13942975, | |
| "TT": 1063735, | |
| "TV": 1066, | |
| "TZ": 40401432, | |
| "UG": 1686867, | |
| "UM": 316, | |
| "US": 319333440, | |
| "VC": 97334, | |
| "VG": 36633, | |
| "VI": 79676, | |
| "VU": 247616, | |
| "WS": 4279, | |
| "YE": 2689596, | |
| "ZA": 17503716, | |
| "ZM": 2788256, | |
| "ZW": 6109446 | |
| } | |
| }, | |
| { | |
| "language_name": "Chinese", | |
| "bcp_47": "zh", | |
| "speakers": 1304678914, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3977775857451761, | |
| "chrf": 57.672913792439125 | |
| } | |
| ], | |
| "bleu": 0.3977775857451761, | |
| "chrf": 57.672913792439125, | |
| "commonvoice_hours": 422.0, | |
| "commonvoice_locale": "zh-TW", | |
| "population": { | |
| "AU": 534796, | |
| "BN": 51093, | |
| "CA": 678494, | |
| "CN": 1254618000, | |
| "GB": 197283, | |
| "GF": 4988, | |
| "HK": 7249910, | |
| "ID": 2456639, | |
| "MN": 44352, | |
| "MO": 632892, | |
| "MY": 5550857, | |
| "PA": 5841, | |
| "PF": 23019, | |
| "PH": 797021, | |
| "SG": 4781438, | |
| "SR": 6705, | |
| "TH": 1241593, | |
| "TW": 22422850, | |
| "US": 2295209, | |
| "VN": 1085934 | |
| } | |
| }, | |
| { | |
| "language_name": "Hindi", | |
| "bcp_47": "hi", | |
| "speakers": 546882144, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.333521621016373, | |
| "chrf": 50.48364584189306 | |
| } | |
| ], | |
| "bleu": 0.333521621016373, | |
| "chrf": 50.48364584189306, | |
| "commonvoice_hours": 16.0, | |
| "commonvoice_locale": "hi-IN", | |
| "population": { | |
| "CA": 188470, | |
| "FJ": 411829, | |
| "IN": 545022990, | |
| "NP": 127377, | |
| "UG": 2206, | |
| "ZA": 1129272 | |
| } | |
| }, | |
| { | |
| "language_name": "Spanish", | |
| "bcp_47": "es", | |
| "speakers": 493528077, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.29160032861883095, | |
| "chrf": 47.668399832701844 | |
| } | |
| ], | |
| "bleu": 0.29160032861883095, | |
| "chrf": 47.668399832701844, | |
| "commonvoice_hours": 446.0, | |
| "commonvoice_locale": "es", | |
| "population": { | |
| "AD": 33110, | |
| "AR": 45479100, | |
| "BO": 7100339, | |
| "BR": 76218, | |
| "BZ": 111887, | |
| "CA": 603106, | |
| "CL": 17823064, | |
| "CO": 45648864, | |
| "CR": 4843090, | |
| "CU": 11059100, | |
| "CW": 5751, | |
| "DE": 4809582, | |
| "DO": 8189766, | |
| "EA": 147000, | |
| "EC": 16228704, | |
| "ES": 49515642, | |
| "FR": 8820266, | |
| "GB": 5260888, | |
| "GI": 14790, | |
| "GQ": 727475, | |
| "GT": 15952569, | |
| "HN": 7203565, | |
| "IC": 2056618, | |
| "MA": 23115, | |
| "MX": 106779500, | |
| "NI": 4838683, | |
| "PA": 2686915, | |
| "PE": 23297950, | |
| "PH": 33846110, | |
| "PR": 2774491, | |
| "PT": 1030270, | |
| "PY": 230134, | |
| "RO": 2130290, | |
| "SV": 5768179, | |
| "SX": 4823, | |
| "TT": 4110, | |
| "US": 31933344, | |
| "UY": 2981097, | |
| "VE": 23488572 | |
| } | |
| }, | |
| { | |
| "language_name": "Arabic", | |
| "bcp_47": "ar", | |
| "speakers": 351664197, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.277257629790728, | |
| "chrf": 46.62779335380641 | |
| } | |
| ], | |
| "bleu": 0.277257629790728, | |
| "chrf": 46.62779335380641, | |
| "commonvoice_hours": 91.0, | |
| "commonvoice_locale": "ar", | |
| "population": { | |
| "AE": 7793822, | |
| "BH": 1309350, | |
| "CA": 565412, | |
| "CM": 108206, | |
| "CY": 1267, | |
| "DJ": 67292, | |
| "DZ": 31799946, | |
| "EG": 97876560, | |
| "EH": 652271, | |
| "ER": 297979, | |
| "GB": 197283, | |
| "IL": 1735096, | |
| "IQ": 26433436, | |
| "IR": 1698466, | |
| "JO": 10820600, | |
| "KE": 24623, | |
| "KM": 558545, | |
| "KW": 2993710, | |
| "LB": 4703865, | |
| "LY": 5099000, | |
| "MA": 22048254, | |
| "ML": 175981, | |
| "MR": 3404658, | |
| "NE": 47822, | |
| "NG": 151960, | |
| "OM": 3778520, | |
| "PS": 4818260, | |
| "QA": 2175311, | |
| "SA": 34173500, | |
| "SD": 27792576, | |
| "SO": 3997414, | |
| "SS": 2851524, | |
| "SY": 15518720, | |
| "TD": 2869158, | |
| "TJ": 976, | |
| "TN": 10549080, | |
| "TR": 459298, | |
| "YE": 22114456 | |
| } | |
| }, | |
| { | |
| "language_name": "Urdu", | |
| "bcp_47": "ur", | |
| "speakers": 290790290, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2659144372728079, | |
| "chrf": 44.14831240898717 | |
| } | |
| ], | |
| "bleu": 0.2659144372728079, | |
| "chrf": 44.14831240898717, | |
| "commonvoice_hours": 76.0, | |
| "commonvoice_locale": "ur", | |
| "population": { | |
| "CA": 286475, | |
| "GB": 2301638, | |
| "IN": 66304500, | |
| "MU": 71727, | |
| "PK": 221825950 | |
| } | |
| }, | |
| { | |
| "language_name": "French", | |
| "bcp_47": "fr", | |
| "speakers": 278611507, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.315663773358301, | |
| "chrf": 49.253978669350964 | |
| } | |
| ], | |
| "bleu": 0.315663773358301, | |
| "chrf": 49.253978669350964, | |
| "commonvoice_hours": 1052.0, | |
| "commonvoice_locale": "fr", | |
| "population": { | |
| "AD": 5775, | |
| "AT": 974540, | |
| "BE": 4453866, | |
| "BF": 4583788, | |
| "BI": 7000822, | |
| "BJ": 4502610, | |
| "BL": 6837, | |
| "CA": 11308230, | |
| "CD": 3867640, | |
| "CF": 2935521, | |
| "CG": 4446179, | |
| "CH": 1764838, | |
| "CI": 13465739, | |
| "CM": 18866600, | |
| "CY": 88668, | |
| "DE": 14428746, | |
| "DJ": 19358, | |
| "DZ": 8594580, | |
| "FR": 67169718, | |
| "GA": 1405473, | |
| "GB": 15125053, | |
| "GF": 153622, | |
| "GN": 3632946, | |
| "GP": 407498, | |
| "GQ": 73584, | |
| "GR": 954639, | |
| "HT": 520187, | |
| "HU": 293155, | |
| "IE": 880017, | |
| "IT": 3931370, | |
| "KM": 473917, | |
| "LB": 20238, | |
| "LU": 546691, | |
| "MA": 7112340, | |
| "MC": 38610, | |
| "MF": 32556, | |
| "MG": 18599433, | |
| "ML": 8994564, | |
| "MQ": 427408, | |
| "MR": 680932, | |
| "MT": 50299, | |
| "MU": 41381, | |
| "NC": 278409, | |
| "NE": 6603996, | |
| "NL": 5011316, | |
| "PF": 180024, | |
| "PM": 5133, | |
| "PT": 1545405, | |
| "RE": 700950, | |
| "RO": 3621493, | |
| "RW": 2288, | |
| "SC": 57589, | |
| "SN": 6137196, | |
| "SY": 1144506, | |
| "TD": 4388124, | |
| "TF": 140, | |
| "TG": 5251148, | |
| "TN": 8673688, | |
| "US": 1862778, | |
| "VU": 149166, | |
| "WF": 7610, | |
| "YT": 110580 | |
| } | |
| }, | |
| { | |
| "language_name": "Bangla", | |
| "bcp_47": "bn", | |
| "speakers": 267193288, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21265887286151353, | |
| "chrf": 41.501657722373686 | |
| } | |
| ], | |
| "bleu": 0.21265887286151353, | |
| "chrf": 41.501657722373686, | |
| "commonvoice_hours": 49.0, | |
| "commonvoice_locale": "bn", | |
| "population": { | |
| "BD": 159397980, | |
| "CA": 90466, | |
| "GB": 263044, | |
| "IN": 107413290, | |
| "NP": 28508 | |
| } | |
| }, | |
| { | |
| "language_name": "Portuguese", | |
| "bcp_47": "pt", | |
| "speakers": 237496885, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.27514792195783394, | |
| "chrf": 45.901248962808694 | |
| } | |
| ], | |
| "bleu": 0.27514792195783394, | |
| "chrf": 45.901248962808694, | |
| "commonvoice_hours": 176.0, | |
| "commonvoice_locale": "pt", | |
| "population": { | |
| "AG": 1571, | |
| "AO": 21789941, | |
| "BR": 192661560, | |
| "CA": 229934, | |
| "CH": 285736, | |
| "CV": 443274, | |
| "FR": 882027, | |
| "GB": 131522, | |
| "GQ": 1, | |
| "GW": 1927100, | |
| "LU": 100541, | |
| "MO": 30723, | |
| "MZ": 8126514, | |
| "PT": 9890592, | |
| "ST": 179454, | |
| "TL": 816395 | |
| } | |
| }, | |
| { | |
| "language_name": "Punjabi", | |
| "bcp_47": "pa", | |
| "speakers": 203571210, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.32250608979374484, | |
| "chrf": 48.43043110055342 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3048037308116852, | |
| "chrf": 48.4304965568793 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.2314793285308931, | |
| "chrf": 37.53667069805556 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.37468960333154994, | |
| "chrf": 53.381398796420086 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.359056244961623, | |
| "chrf": 52.278269268214366 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.27331521881795146, | |
| "chrf": 45.15087304059057 | |
| } | |
| ], | |
| "bleu": 0.31097503604124127, | |
| "chrf": 47.53468991011888, | |
| "commonvoice_hours": 2.3, | |
| "commonvoice_locale": "pa-IN", | |
| "population": { | |
| "CA": 603106, | |
| "GB": 2367400, | |
| "IN": 37130520, | |
| "KE": 10170, | |
| "PK": 163450700, | |
| "SG": 9314 | |
| } | |
| }, | |
| { | |
| "language_name": "Russian", | |
| "bcp_47": "ru", | |
| "speakers": 195841151, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.26108507692625094, | |
| "chrf": 45.063308940468154 | |
| } | |
| ], | |
| "bleu": 0.26108507692625094, | |
| "chrf": 45.063308940468154, | |
| "commonvoice_hours": 241.0, | |
| "commonvoice_locale": "ru", | |
| "population": { | |
| "BG": 1602387, | |
| "BY": 1137350, | |
| "CA": 211087, | |
| "CN": 13940, | |
| "DE": 4809582, | |
| "EE": 688027, | |
| "FI": 45131, | |
| "GE": 359730, | |
| "IL": 954303, | |
| "KG": 2147364, | |
| "KZ": 13746168, | |
| "LT": 2185168, | |
| "LV": 714867, | |
| "MD": 100935, | |
| "MN": 4118, | |
| "PL": 6890814, | |
| "RU": 133218680, | |
| "SJ": 1200, | |
| "TJ": 1064840, | |
| "TM": 663436, | |
| "UA": 20204534, | |
| "US": 798334, | |
| "UZ": 4279156 | |
| } | |
| }, | |
| { | |
| "language_name": "Swahili", | |
| "bcp_47": "sw", | |
| "speakers": 171610296, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2709203338132304, | |
| "chrf": 44.36399636969686 | |
| } | |
| ], | |
| "bleu": 0.2709203338132304, | |
| "chrf": 44.36399636969686, | |
| "commonvoice_hours": 411.0, | |
| "commonvoice_locale": "sw", | |
| "population": { | |
| "BI": 6408, | |
| "CD": 50890000, | |
| "KE": 35328414, | |
| "MZ": 9330, | |
| "SO": 235142, | |
| "TZ": 52697520, | |
| "UG": 32439750, | |
| "YT": 2716, | |
| "ZA": 1016 | |
| } | |
| }, | |
| { | |
| "language_name": "Indonesian", | |
| "bcp_47": "id", | |
| "speakers": 171207687, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.27441353638286026, | |
| "chrf": 46.025445629112156 | |
| } | |
| ], | |
| "bleu": 0.27441353638286026, | |
| "chrf": 46.025445629112156, | |
| "commonvoice_hours": 33.0, | |
| "commonvoice_locale": "id", | |
| "population": { | |
| "ID": 170896640, | |
| "NL": 311047 | |
| } | |
| }, | |
| { | |
| "language_name": "German", | |
| "bcp_47": "de", | |
| "speakers": 136350226, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3338682761061998, | |
| "chrf": 50.216731068308064 | |
| } | |
| ], | |
| "bleu": 0.3338682761061998, | |
| "chrf": 50.216731068308064, | |
| "commonvoice_hours": 1357.0, | |
| "commonvoice_locale": "de", | |
| "population": { | |
| "AT": 8593666, | |
| "BE": 2578554, | |
| "BG": 557352, | |
| "BR": 1778414, | |
| "CA": 294014, | |
| "CH": 6134913, | |
| "CZ": 1605375, | |
| "DE": 72945327, | |
| "DK": 2758623, | |
| "FI": 1002901, | |
| "FR": 3392410, | |
| "GB": 5918499, | |
| "GR": 530355, | |
| "HU": 1758929, | |
| "IT": 998443, | |
| "KZ": 1221882, | |
| "LI": 39137, | |
| "LT": 382404, | |
| "LU": 395880, | |
| "NA": 23671, | |
| "NL": 12269084, | |
| "PL": 7273637, | |
| "PY": 208559, | |
| "RO": 44736, | |
| "SI": 883126, | |
| "SK": 1196932, | |
| "US": 1563403 | |
| } | |
| }, | |
| { | |
| "language_name": "Japanese", | |
| "bcp_47": "ja", | |
| "speakers": 119729026, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2940100667664714, | |
| "chrf": 46.403097021492236 | |
| } | |
| ], | |
| "bleu": 0.2940100667664714, | |
| "chrf": 46.403097021492236, | |
| "commonvoice_hours": 222.0, | |
| "commonvoice_locale": "ja", | |
| "population": { | |
| "BR": 444604, | |
| "CA": 52772, | |
| "JP": 119231650 | |
| } | |
| }, | |
| { | |
| "language_name": "Telugu", | |
| "bcp_47": "te", | |
| "speakers": 95478480, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.28964452051612244, | |
| "chrf": 45.75290973782886 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2750887189010237, | |
| "chrf": 46.31463752811596 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.1314237858560668, | |
| "chrf": 27.750433857144273 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.35187073123584545, | |
| "chrf": 52.04190885735586 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.2808664068178743, | |
| "chrf": 48.221979700718 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.16468103557770178, | |
| "chrf": 36.43981433605732 | |
| } | |
| ], | |
| "bleu": 0.24892919981743908, | |
| "chrf": 42.75361400287005, | |
| "commonvoice_hours": 0.3, | |
| "commonvoice_locale": "te", | |
| "population": { | |
| "IN": 95478480 | |
| } | |
| }, | |
| { | |
| "language_name": "Marathi", | |
| "bcp_47": "mr", | |
| "speakers": 92826300, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.235200323237626, | |
| "chrf": 39.43789667749676 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2584800238292114, | |
| "chrf": 44.69889855306244 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.1158656438579424, | |
| "chrf": 27.118712681006436 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3039098126596327, | |
| "chrf": 48.26657289026638 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.23702154369195902, | |
| "chrf": 43.039588362590955 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.14770612974379574, | |
| "chrf": 35.63558588907277 | |
| } | |
| ], | |
| "bleu": 0.21636391283669454, | |
| "chrf": 39.69954250891596, | |
| "commonvoice_hours": 20.0, | |
| "commonvoice_locale": "mr", | |
| "population": { | |
| "IN": 92826300 | |
| } | |
| }, | |
| { | |
| "language_name": "Javanese", | |
| "bcp_47": "jv", | |
| "speakers": 91180665, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23082586428104943, | |
| "chrf": 41.42591471734489 | |
| } | |
| ], | |
| "bleu": 0.23082586428104943, | |
| "chrf": 41.42591471734489, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "jv", | |
| "population": { | |
| "ID": 90788840, | |
| "MY": 391825 | |
| } | |
| }, | |
| { | |
| "language_name": "Vietnamese", | |
| "bcp_47": "vi", | |
| "speakers": 86222962, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.2790022403255029, | |
| "chrf": 44.76577365559692 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.252552287345529, | |
| "chrf": 43.351007120897606 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.17142561681893811, | |
| "chrf": 34.23876708175754 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.32076560886563743, | |
| "chrf": 49.46269756420099 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.269842412561934, | |
| "chrf": 44.17252674642975 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.19118351096728373, | |
| "chrf": 37.642090247027234 | |
| } | |
| ], | |
| "bleu": 0.24746194614747083, | |
| "chrf": 42.272143735985004, | |
| "commonvoice_hours": 5.9, | |
| "commonvoice_locale": "vi", | |
| "population": { | |
| "CA": 184701, | |
| "CN": 6970, | |
| "US": 1130973, | |
| "VN": 84900318 | |
| } | |
| }, | |
| { | |
| "language_name": "Tamil", | |
| "bcp_47": "ta", | |
| "speakers": 85616159, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.2159676106476219, | |
| "chrf": 38.592451568525966 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.24147470924504938, | |
| "chrf": 41.98664320436057 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.11055269618146167, | |
| "chrf": 26.929660798631293 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.2993653070835946, | |
| "chrf": 46.760725728832945 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.22772498517043588, | |
| "chrf": 40.963440857462984 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.14949134449145374, | |
| "chrf": 33.188135588116566 | |
| } | |
| ], | |
| "bleu": 0.2074294421366029, | |
| "chrf": 38.07017629098839, | |
| "commonvoice_hours": 234.0, | |
| "commonvoice_locale": "ta", | |
| "population": { | |
| "CA": 184701, | |
| "GB": 2104355, | |
| "IN": 78239310, | |
| "LK": 3433380, | |
| "MU": 34484, | |
| "MY": 1371388, | |
| "RE": 118138, | |
| "SG": 130403 | |
| } | |
| }, | |
| { | |
| "language_name": "Persian", | |
| "bcp_47": "fa", | |
| "speakers": 84710459, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2543274430452483, | |
| "chrf": 44.798186786819564 | |
| } | |
| ], | |
| "bleu": 0.2543274430452483, | |
| "chrf": 44.798186786819564, | |
| "commonvoice_hours": 370.0, | |
| "commonvoice_locale": "fa", | |
| "population": { | |
| "AE": 189850, | |
| "AF": 18321900, | |
| "CA": 245012, | |
| "IQ": 338192, | |
| "IR": 63692475, | |
| "OM": 43849, | |
| "PK": 1541107, | |
| "QA": 268859, | |
| "TJ": 69215 | |
| } | |
| }, | |
| { | |
| "language_name": "Turkish", | |
| "bcp_47": "tr", | |
| "speakers": 80360704, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2848412390293461, | |
| "chrf": 45.023438128876236 | |
| } | |
| ], | |
| "bleu": 0.2848412390293461, | |
| "chrf": 45.023438128876236, | |
| "commonvoice_hours": 127.0, | |
| "commonvoice_locale": "tr", | |
| "population": { | |
| "BG": 766359, | |
| "CA": 37694, | |
| "CY": 291336, | |
| "DE": 2003992, | |
| "GB": 131522, | |
| "GR": 127285, | |
| "MK": 74409, | |
| "NL": 207365, | |
| "RO": 27694, | |
| "TR": 76276275, | |
| "UA": 184476, | |
| "UZ": 232297 | |
| } | |
| }, | |
| { | |
| "language_name": "Cantonese", | |
| "bcp_47": "yue", | |
| "speakers": 79654759, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2745324223697869, | |
| "chrf": 46.18505717482203 | |
| } | |
| ], | |
| "bleu": 0.2745324223697869, | |
| "chrf": 46.18505717482203, | |
| "commonvoice_hours": 203.0, | |
| "commonvoice_locale": "yue", | |
| "population": { | |
| "CA": 640800, | |
| "CN": 72489040, | |
| "HK": 6524919 | |
| } | |
| }, | |
| { | |
| "language_name": "Korean", | |
| "bcp_47": "ko", | |
| "speakers": 78357046, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21423807187509414, | |
| "chrf": 42.31955622695572 | |
| } | |
| ], | |
| "bleu": 0.21423807187509414, | |
| "chrf": 42.31955622695572, | |
| "commonvoice_hours": 1.7, | |
| "commonvoice_locale": "ko", | |
| "population": { | |
| "BR": 44460, | |
| "CA": 169623, | |
| "CN": 2091030, | |
| "JP": 652636, | |
| "KP": 22566280, | |
| "KR": 51835100, | |
| "US": 997917 | |
| } | |
| }, | |
| { | |
| "language_name": "Italian", | |
| "bcp_47": "it", | |
| "speakers": 70247060, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.29744196180619636, | |
| "chrf": 46.58884190721562 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2947459489130278, | |
| "chrf": 48.23578446556176 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.26709213193768344, | |
| "chrf": 43.42719841351614 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.34518602347709243, | |
| "chrf": 51.45922256128821 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.3136120219290237, | |
| "chrf": 49.456527591725454 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.26629405288011837, | |
| "chrf": 44.95821657057411 | |
| } | |
| ], | |
| "bleu": 0.29739535682385704, | |
| "chrf": 47.35429858498022, | |
| "commonvoice_hours": 362.0, | |
| "commonvoice_locale": "it", | |
| "population": { | |
| "AT": 797350, | |
| "AU": 483864, | |
| "BR": 592805, | |
| "CA": 343016, | |
| "CH": 361372, | |
| "DE": 5611179, | |
| "FR": 1153419, | |
| "GB": 131522, | |
| "HR": 67644, | |
| "IT": 59282565, | |
| "MT": 256070, | |
| "SI": 3995, | |
| "SM": 30466, | |
| "US": 1130973, | |
| "VA": 820 | |
| } | |
| }, | |
| { | |
| "language_name": "Filipino", | |
| "bcp_47": "fil", | |
| "speakers": 67471096, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3020075248846111, | |
| "chrf": 45.148692233744825 | |
| } | |
| ], | |
| "bleu": 0.3020075248846111, | |
| "chrf": 45.148692233744825, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "tl", | |
| "population": { | |
| "CA": 565412, | |
| "PH": 65508600, | |
| "US": 1397084 | |
| } | |
| }, | |
| { | |
| "language_name": "Egyptian Arabic", | |
| "bcp_47": "arz", | |
| "speakers": 66639360, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.18353324091064518, | |
| "chrf": 37.67362087042454 | |
| } | |
| ], | |
| "bleu": 0.18353324091064518, | |
| "chrf": 37.67362087042454, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "EG": 66639360 | |
| } | |
| }, | |
| { | |
| "language_name": "Gujarati", | |
| "bcp_47": "gu", | |
| "speakers": 61721799, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.27618486571036477, | |
| "chrf": 45.30697533607047 | |
| } | |
| ], | |
| "bleu": 0.27618486571036477, | |
| "chrf": 45.30697533607047, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "gu-IN", | |
| "population": { | |
| "CA": 135699, | |
| "GB": 1907072, | |
| "IN": 59674050, | |
| "KE": 4978 | |
| } | |
| }, | |
| { | |
| "language_name": "Thai", | |
| "bcp_47": "th", | |
| "speakers": 55181920, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2461561900137243, | |
| "chrf": 43.886996888191135 | |
| } | |
| ], | |
| "bleu": 0.2461561900137243, | |
| "chrf": 43.886996888191135, | |
| "commonvoice_hours": 172.0, | |
| "commonvoice_locale": "th", | |
| "population": { | |
| "TH": 55181920 | |
| } | |
| }, | |
| { | |
| "language_name": "Kannada", | |
| "bcp_47": "kn", | |
| "speakers": 49065330, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.25650866519447973, | |
| "chrf": 43.53706086839864 | |
| } | |
| ], | |
| "bleu": 0.25650866519447973, | |
| "chrf": 43.53706086839864, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "kn", | |
| "population": { | |
| "IN": 49065330 | |
| } | |
| }, | |
| { | |
| "language_name": "Malayalam", | |
| "bcp_47": "ml", | |
| "speakers": 43257484, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.23073727076678055, | |
| "chrf": 41.53402359471923 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21782657144614825, | |
| "chrf": 41.630569782738704 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.1695641998407403, | |
| "chrf": 33.20242503336964 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3195014249623395, | |
| "chrf": 50.399254960139395 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.2633223158501049, | |
| "chrf": 45.473592535604965 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.19162873119255258, | |
| "chrf": 38.21485785002488 | |
| } | |
| ], | |
| "bleu": 0.23209675234311103, | |
| "chrf": 41.7424539594328, | |
| "commonvoice_hours": 2.8, | |
| "commonvoice_locale": "ml", | |
| "population": { | |
| "AE": 699446, | |
| "BH": 49665, | |
| "IL": 7981, | |
| "IN": 42434880, | |
| "MY": 48978, | |
| "QA": 6599, | |
| "SG": 9935 | |
| } | |
| }, | |
| { | |
| "language_name": "Odia", | |
| "bcp_47": "or", | |
| "speakers": 42434880, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2616054244059909, | |
| "chrf": 44.81898318236423 | |
| } | |
| ], | |
| "bleu": 0.2616054244059909, | |
| "chrf": 44.81898318236423, | |
| "commonvoice_hours": 2.8, | |
| "commonvoice_locale": "or", | |
| "population": { | |
| "IN": 42434880 | |
| } | |
| }, | |
| { | |
| "language_name": "Polish", | |
| "bcp_47": "pl", | |
| "speakers": 41077399, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.24382878885531348, | |
| "chrf": 43.88802125000008 | |
| } | |
| ], | |
| "bleu": 0.24382878885531348, | |
| "chrf": 43.88802125000008, | |
| "commonvoice_hours": 174.0, | |
| "commonvoice_locale": "pl", | |
| "population": { | |
| "CA": 173393, | |
| "CZ": 52442, | |
| "DE": 232463, | |
| "GB": 2630444, | |
| "IL": 130132, | |
| "PL": 36751008, | |
| "RO": 2769, | |
| "SK": 50598, | |
| "UA": 1054150 | |
| } | |
| }, | |
| { | |
| "language_name": "Hausa", | |
| "bcp_47": "ha", | |
| "speakers": 40411882, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1493358875548207, | |
| "chrf": 31.734228520521885 | |
| } | |
| ], | |
| "bleu": 0.1493358875548207, | |
| "chrf": 31.734228520521885, | |
| "commonvoice_hours": 4.1, | |
| "commonvoice_locale": "ha", | |
| "population": { | |
| "CM": 38843, | |
| "GH": 252326, | |
| "NE": 9336684, | |
| "NG": 29963920, | |
| "SD": 820109 | |
| } | |
| }, | |
| { | |
| "language_name": "Sindhi", | |
| "bcp_47": "sd", | |
| "speakers": 40329510, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.22524971121549384, | |
| "chrf": 41.35718488130492 | |
| } | |
| ], | |
| "bleu": 0.22524971121549384, | |
| "chrf": 41.35718488130492, | |
| "commonvoice_hours": 0.4, | |
| "commonvoice_locale": "sd", | |
| "population": { | |
| "IN": 5304360, | |
| "PK": 35025150 | |
| } | |
| }, | |
| { | |
| "language_name": "Malay", | |
| "bcp_47": "ms", | |
| "speakers": 38097307, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.27545115634664297, | |
| "chrf": 46.5366529956061 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2445459295400275, | |
| "chrf": 43.683725288188164 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.23380594556884363, | |
| "chrf": 38.09288562825641 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3521510571182875, | |
| "chrf": 51.6107732437805 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.2984537737499322, | |
| "chrf": 47.07139912930323 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.20974647653543713, | |
| "chrf": 40.94603982712764 | |
| } | |
| ], | |
| "bleu": 0.2690257231431951, | |
| "chrf": 44.656912685377016, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ms", | |
| "population": { | |
| "BN": 455189, | |
| "CC": 495, | |
| "ID": 12283196, | |
| "MY": 24489075, | |
| "SG": 869352 | |
| } | |
| }, | |
| { | |
| "language_name": "Burmese", | |
| "bcp_47": "my", | |
| "speakers": 36559231, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.17529594258449108, | |
| "chrf": 38.09396067803311 | |
| } | |
| ], | |
| "bleu": 0.17529594258449108, | |
| "chrf": 38.09396067803311, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "my", | |
| "population": { | |
| "BD": 341567, | |
| "MM": 36217664 | |
| } | |
| }, | |
| { | |
| "language_name": "Amharic", | |
| "bcp_47": "am", | |
| "speakers": 35728475, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.16453710162389373, | |
| "chrf": 34.89886094698235 | |
| } | |
| ], | |
| "bleu": 0.16453710162389373, | |
| "chrf": 34.89886094698235, | |
| "commonvoice_hours": 1.8, | |
| "commonvoice_locale": "am", | |
| "population": { | |
| "ET": 35677290, | |
| "IL": 51185 | |
| } | |
| }, | |
| { | |
| "language_name": "Oromo", | |
| "bcp_47": "om", | |
| "speakers": 34897121, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.0691897827221633, | |
| "chrf": 22.166735299684706 | |
| } | |
| ], | |
| "bleu": 0.0691897827221633, | |
| "chrf": 22.166735299684706, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "om", | |
| "population": { | |
| "ET": 34596160, | |
| "KE": 251581, | |
| "SO": 49380 | |
| } | |
| }, | |
| { | |
| "language_name": "Bhojpuri", | |
| "bcp_47": "bho", | |
| "speakers": 32934797, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23176648838308359, | |
| "chrf": 42.06617216025931 | |
| } | |
| ], | |
| "bleu": 0.23176648838308359, | |
| "chrf": 42.06617216025931, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 30500070, | |
| "MU": 372430, | |
| "NP": 2062297 | |
| } | |
| }, | |
| { | |
| "language_name": "Uzbek", | |
| "bcp_47": "uz", | |
| "speakers": 32792780, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2038544554531401, | |
| "chrf": 39.8364082393657 | |
| } | |
| ], | |
| "bleu": 0.2038544554531401, | |
| "chrf": 39.8364082393657, | |
| "commonvoice_hours": 100.0, | |
| "commonvoice_locale": "uz", | |
| "population": { | |
| "AF": 1722259, | |
| "CN": 5576, | |
| "TM": 497577, | |
| "TR": 1968, | |
| "UZ": 30565400 | |
| } | |
| }, | |
| { | |
| "language_name": "Azerbaijani", | |
| "bcp_47": "az", | |
| "speakers": 32446682, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1911853993562902, | |
| "chrf": 38.284553121320506 | |
| } | |
| ], | |
| "bleu": 0.1911853993562902, | |
| "chrf": 38.284553121320506, | |
| "commonvoice_hours": 0.5, | |
| "commonvoice_locale": "az", | |
| "population": { | |
| "AM": 0, | |
| "AZ": 10093536, | |
| "IQ": 699709, | |
| "IR": 20381592, | |
| "RU": 131801, | |
| "TR": 1140044 | |
| } | |
| }, | |
| { | |
| "language_name": "Sundanese", | |
| "bcp_47": "su", | |
| "speakers": 32043120, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.18638464691782505, | |
| "chrf": 36.390067106438586 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.22413489641063433, | |
| "chrf": 39.08607675576149 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.12396443500389862, | |
| "chrf": 27.44605100630464 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.31100961611618916, | |
| "chrf": 48.684591434160616 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.23467068441612768, | |
| "chrf": 40.54860164135514 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.1315217916431994, | |
| "chrf": 32.71394871178255 | |
| } | |
| ], | |
| "bleu": 0.20194767841797903, | |
| "chrf": 37.47822277596717, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "ID": 32043120 | |
| } | |
| }, | |
| { | |
| "language_name": "Dutch", | |
| "bcp_47": "nl", | |
| "speakers": 31765645, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2592795402705898, | |
| "chrf": 44.356739380497835 | |
| } | |
| ], | |
| "bleu": 0.2592795402705898, | |
| "chrf": 44.356739380497835, | |
| "commonvoice_hours": 114.0, | |
| "commonvoice_locale": "nl", | |
| "population": { | |
| "AW": 115845, | |
| "BE": 6446385, | |
| "BQ": 1600, | |
| "CA": 56541, | |
| "CW": 12108, | |
| "DE": 7214373, | |
| "FR": 88203, | |
| "NL": 17280400, | |
| "SR": 548612, | |
| "SX": 1578 | |
| } | |
| }, | |
| { | |
| "language_name": "Moroccan Arabic", | |
| "bcp_47": "ary", | |
| "speakers": 30938679, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1795140543637709, | |
| "chrf": 37.426822543484725 | |
| } | |
| ], | |
| "bleu": 0.1795140543637709, | |
| "chrf": 37.426822543484725, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "MA": 30938679 | |
| } | |
| }, | |
| { | |
| "language_name": "Ukrainian", | |
| "bcp_47": "uk", | |
| "speakers": 29348975, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.2564463888571809, | |
| "chrf": 41.5181715644979 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2922812040972885, | |
| "chrf": 46.82127627710616 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.24225796102393954, | |
| "chrf": 39.42058485499366 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3452563778145038, | |
| "chrf": 50.96771482708702 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.3292127494173498, | |
| "chrf": 48.580427643849056 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.2452825737163755, | |
| "chrf": 42.05493360532406 | |
| } | |
| ], | |
| "bleu": 0.28512287582110635, | |
| "chrf": 44.893851462142976, | |
| "commonvoice_hours": 98.0, | |
| "commonvoice_locale": "uk", | |
| "population": { | |
| "CA": 75388, | |
| "MD": 471030, | |
| "PL": 149301, | |
| "RS": 0, | |
| "SK": 103371, | |
| "UA": 28549885 | |
| } | |
| }, | |
| { | |
| "language_name": "Yoruba", | |
| "bcp_47": "yo", | |
| "speakers": 28685568, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.09852676389614487, | |
| "chrf": 25.656950226425916 | |
| } | |
| ], | |
| "bleu": 0.09852676389614487, | |
| "chrf": 25.656950226425916, | |
| "commonvoice_hours": 5.9, | |
| "commonvoice_locale": "yo", | |
| "population": { | |
| "BJ": 861928, | |
| "NG": 27823640 | |
| } | |
| }, | |
| { | |
| "language_name": "Igbo", | |
| "bcp_47": "ig", | |
| "speakers": 27823640, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1549827013842116, | |
| "chrf": 35.431035675871804 | |
| } | |
| ], | |
| "bleu": 0.1549827013842116, | |
| "chrf": 35.431035675871804, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ig", | |
| "population": { | |
| "NG": 27823640 | |
| } | |
| }, | |
| { | |
| "language_name": "Cebuano", | |
| "bcp_47": "ceb", | |
| "speakers": 26203440, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.27783470672988303, | |
| "chrf": 43.53549785827671 | |
| } | |
| ], | |
| "bleu": 0.27783470672988303, | |
| "chrf": 43.53549785827671, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "PH": 26203440 | |
| } | |
| }, | |
| { | |
| "language_name": "Awadhi", | |
| "bcp_47": "awa", | |
| "speakers": 25862924, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2554810263222905, | |
| "chrf": 42.35795046006446 | |
| } | |
| ], | |
| "bleu": 0.2554810263222905, | |
| "chrf": 42.35795046006446, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 25195710, | |
| "NP": 667214 | |
| } | |
| }, | |
| { | |
| "language_name": "Malagasy", | |
| "bcp_47": "mg", | |
| "speakers": 24260130, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.15163299980391426, | |
| "chrf": 32.41299083831688 | |
| } | |
| ], | |
| "bleu": 0.15163299980391426, | |
| "chrf": 32.41299083831688, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "mg", | |
| "population": { | |
| "MG": 24260130 | |
| } | |
| }, | |
| { | |
| "language_name": "Romanian", | |
| "bcp_47": "ro", | |
| "speakers": 22187408, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.33899025568959984, | |
| "chrf": 49.419389839471826 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.26666997541189236, | |
| "chrf": 44.76525386460237 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.24172488724041316, | |
| "chrf": 37.98045602918644 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.37365302832845815, | |
| "chrf": 52.777299654432 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.332600965807992, | |
| "chrf": 49.14582652136321 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.2510789925018768, | |
| "chrf": 42.27877315264307 | |
| } | |
| ], | |
| "bleu": 0.30078635083003874, | |
| "chrf": 46.06116651028316, | |
| "commonvoice_hours": 21.0, | |
| "commonvoice_locale": "ro", | |
| "population": { | |
| "CA": 101774, | |
| "HU": 96741, | |
| "IL": 320993, | |
| "MD": 2119635, | |
| "RO": 19172610, | |
| "RS": 147256, | |
| "UA": 228399 | |
| } | |
| }, | |
| { | |
| "language_name": "Nepali", | |
| "bcp_47": "ne", | |
| "speakers": 20903374, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.26199282928489126, | |
| "chrf": 44.7560662712792 | |
| } | |
| ], | |
| "bleu": 0.26199282928489126, | |
| "chrf": 44.7560662712792, | |
| "commonvoice_hours": 1.3, | |
| "commonvoice_locale": "ne-NP", | |
| "population": { | |
| "BT": 132994, | |
| "IN": 7426104, | |
| "NP": 13344276 | |
| } | |
| }, | |
| { | |
| "language_name": "Maithili", | |
| "bcp_47": "mai", | |
| "speakers": 19249149, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23975507119180453, | |
| "chrf": 41.8894484718934 | |
| } | |
| ], | |
| "bleu": 0.23975507119180453, | |
| "chrf": 41.8894484718934, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "mai", | |
| "population": { | |
| "IN": 15913080, | |
| "NP": 3336069 | |
| } | |
| }, | |
| { | |
| "language_name": "Assamese", | |
| "bcp_47": "as", | |
| "speakers": 17239170, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.19363225565136952, | |
| "chrf": 38.96237165376663 | |
| } | |
| ], | |
| "bleu": 0.19363225565136952, | |
| "chrf": 38.96237165376663, | |
| "commonvoice_hours": 2.8, | |
| "commonvoice_locale": "as", | |
| "population": { | |
| "IN": 17239170 | |
| } | |
| }, | |
| { | |
| "language_name": "Nyanja", | |
| "bcp_47": "ny", | |
| "speakers": 17026781, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.09504458945778768, | |
| "chrf": 27.576030002164906 | |
| } | |
| ], | |
| "bleu": 0.09504458945778768, | |
| "chrf": 27.576030002164906, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ny", | |
| "population": { | |
| "MW": 13353858, | |
| "MZ": 782553, | |
| "ZM": 2613990, | |
| "ZW": 276380 | |
| } | |
| }, | |
| { | |
| "language_name": "Somali", | |
| "bcp_47": "so", | |
| "speakers": 16911645, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.2024994684991584, | |
| "chrf": 37.37281822856629 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1532133716194419, | |
| "chrf": 32.05620028647162 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.043408496427191995, | |
| "chrf": 15.267715935014895 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3048371831537258, | |
| "chrf": 46.24092673305936 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.21360545410615966, | |
| "chrf": 38.32357547187653 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.06484340154849859, | |
| "chrf": 22.781181465233722 | |
| } | |
| ], | |
| "bleu": 0.16373456255902938, | |
| "chrf": 32.00706968670374, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "so", | |
| "population": { | |
| "CA": 49002, | |
| "DJ": 377940, | |
| "ET": 6486780, | |
| "GB": 131522, | |
| "KE": 695863, | |
| "SO": 9170538 | |
| } | |
| }, | |
| { | |
| "language_name": "Magahi", | |
| "bcp_47": "mag", | |
| "speakers": 15913080, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.29925558767802407, | |
| "chrf": 47.539870710677974 | |
| } | |
| ], | |
| "bleu": 0.29925558767802407, | |
| "chrf": 47.539870710677974, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 15913080 | |
| } | |
| }, | |
| { | |
| "language_name": "Serbian", | |
| "bcp_47": "sr", | |
| "speakers": 15602410, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.26029402164210574, | |
| "chrf": 44.75391848259974 | |
| } | |
| ], | |
| "bleu": 0.26029402164210574, | |
| "chrf": 44.75391848259974, | |
| "commonvoice_hours": 7.4, | |
| "commonvoice_locale": "sr", | |
| "population": { | |
| "BA": 767118, | |
| "CA": 64080, | |
| "ME": 640352, | |
| "RO": 25563, | |
| "RS": 13884096, | |
| "RU": 4960, | |
| "TR": 22965, | |
| "XK": 193276 | |
| } | |
| }, | |
| { | |
| "language_name": "Sinhala", | |
| "bcp_47": "si", | |
| "speakers": 15564656, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.20259734060180434, | |
| "chrf": 39.00188422851495 | |
| } | |
| ], | |
| "bleu": 0.20259734060180434, | |
| "chrf": 39.00188422851495, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "si", | |
| "population": { | |
| "LK": 15564656 | |
| } | |
| }, | |
| { | |
| "language_name": "Khmer", | |
| "bcp_47": "km", | |
| "speakers": 15065030, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.21699232146684352, | |
| "chrf": 41.99979148031644 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21417349432612984, | |
| "chrf": 41.35771196976409 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.03287369352293625, | |
| "chrf": 14.140423341647319 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.34264229339556035, | |
| "chrf": 51.55826045210756 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.24630515818736093, | |
| "chrf": 44.60963216433486 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.11830648687368288, | |
| "chrf": 31.534012306448343 | |
| } | |
| ], | |
| "bleu": 0.1952155746287523, | |
| "chrf": 37.53330528576977, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "km", | |
| "population": { | |
| "KH": 15065030 | |
| } | |
| }, | |
| { | |
| "language_name": "Chhattisgarhi", | |
| "bcp_47": "hne", | |
| "speakers": 14586990, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2212498883000727, | |
| "chrf": 39.102114067893005 | |
| } | |
| ], | |
| "bleu": 0.2212498883000727, | |
| "chrf": 39.102114067893005, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 14586990 | |
| } | |
| }, | |
| { | |
| "language_name": "Nigerian Fulfulde", | |
| "bcp_47": "fuv", | |
| "speakers": 14339876, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.08190470208193343, | |
| "chrf": 23.041107899884107 | |
| } | |
| ], | |
| "bleu": 0.08190470208193343, | |
| "chrf": 23.041107899884107, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "NG": 14339876 | |
| } | |
| }, | |
| { | |
| "language_name": "Zulu", | |
| "bcp_47": "zu", | |
| "speakers": 13973830, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.15449146502209737, | |
| "chrf": 33.087212745906356 | |
| } | |
| ], | |
| "bleu": 0.15449146502209737, | |
| "chrf": 33.087212745906356, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "zu", | |
| "population": { | |
| "LS": 275706, | |
| "MW": 69949, | |
| "MZ": 1806, | |
| "SZ": 75105, | |
| "ZA": 13551264 | |
| } | |
| }, | |
| { | |
| "language_name": "Kazakh", | |
| "bcp_47": "kk", | |
| "speakers": 13637392, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2392246097188628, | |
| "chrf": 42.67763456362536 | |
| } | |
| ], | |
| "bleu": 0.2392246097188628, | |
| "chrf": 42.67763456362536, | |
| "commonvoice_hours": 2.1, | |
| "commonvoice_locale": "kk", | |
| "population": { | |
| "AF": 2015, | |
| "CN": 1184917, | |
| "IR": 2972, | |
| "KZ": 12218816, | |
| "MN": 228098, | |
| "TR": 574 | |
| } | |
| }, | |
| { | |
| "language_name": "Czech", | |
| "bcp_47": "cs", | |
| "speakers": 13045532, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2844520855192069, | |
| "chrf": 47.327010269160255 | |
| } | |
| ], | |
| "bleu": 0.2844520855192069, | |
| "chrf": 47.327010269160255, | |
| "commonvoice_hours": 74.0, | |
| "commonvoice_locale": "cs", | |
| "population": { | |
| "CZ": 10488450, | |
| "SK": 2557082 | |
| } | |
| }, | |
| { | |
| "language_name": "Swedish", | |
| "bcp_47": "sv", | |
| "speakers": 12932871, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.31838456223051165, | |
| "chrf": 48.08041424667649 | |
| } | |
| ], | |
| "bleu": 0.31838456223051165, | |
| "chrf": 48.08041424667649, | |
| "commonvoice_hours": 47.0, | |
| "commonvoice_locale": "sv-SE", | |
| "population": { | |
| "AX": 25938, | |
| "DK": 763023, | |
| "FI": 2451535, | |
| "SE": 9692375 | |
| } | |
| }, | |
| { | |
| "language_name": "Hungarian", | |
| "bcp_47": "hu", | |
| "speakers": 12443430, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2517614908428288, | |
| "chrf": 42.77520440394925 | |
| } | |
| ], | |
| "bleu": 0.2517614908428288, | |
| "chrf": 42.77520440394925, | |
| "commonvoice_hours": 92.0, | |
| "commonvoice_locale": "hu", | |
| "population": { | |
| "AT": 23035, | |
| "CA": 49002, | |
| "HU": 9771830, | |
| "IL": 86755, | |
| "RO": 1405991, | |
| "RS": 336584, | |
| "SI": 9252, | |
| "SK": 598466, | |
| "UA": 162515 | |
| } | |
| }, | |
| { | |
| "language_name": "Greek", | |
| "bcp_47": "el", | |
| "speakers": 12292242, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.24888370153898132, | |
| "chrf": 42.743109839531535 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.27269196827838943, | |
| "chrf": 45.53483489961114 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.21351544070708506, | |
| "chrf": 39.64425368969459 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3500489758234636, | |
| "chrf": 51.1729677922222 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.32858632704534785, | |
| "chrf": 49.70348294319061 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.1903000734693107, | |
| "chrf": 39.41911092527115 | |
| } | |
| ], | |
| "bleu": 0.2673377478104297, | |
| "chrf": 44.7029600149202, | |
| "commonvoice_hours": 20.0, | |
| "commonvoice_locale": "el", | |
| "population": { | |
| "AL": 58417, | |
| "CA": 124391, | |
| "CY": 1203346, | |
| "DE": 304607, | |
| "EG": 63516, | |
| "GR": 10501029, | |
| "IT": 21841, | |
| "RO": 4048, | |
| "TR": 4019, | |
| "UA": 7028 | |
| } | |
| }, | |
| { | |
| "language_name": "Shona", | |
| "bcp_47": "sn", | |
| "speakers": 11782503, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.10438047654339373, | |
| "chrf": 28.358507205354343 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1054140213254438, | |
| "chrf": 28.275522446025796 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.049580893458705456, | |
| "chrf": 18.458313551880636 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.20979752102494492, | |
| "chrf": 38.7737276002067 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.14066476436038525, | |
| "chrf": 32.050887533047465 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.060530921002659346, | |
| "chrf": 22.35054590384825 | |
| } | |
| ], | |
| "bleu": 0.11172809961925541, | |
| "chrf": 28.04458404006053, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "ZW": 11782503 | |
| } | |
| }, | |
| { | |
| "language_name": "Central Kurdish", | |
| "bcp_47": "ckb", | |
| "speakers": 11086549, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.20654412682006296, | |
| "chrf": 38.66802600490074 | |
| } | |
| ], | |
| "bleu": 0.20654412682006296, | |
| "chrf": 38.66802600490074, | |
| "commonvoice_hours": 135.0, | |
| "commonvoice_locale": "ckb", | |
| "population": { | |
| "IQ": 7774540, | |
| "IR": 3312009 | |
| } | |
| }, | |
| { | |
| "language_name": "Kinyarwanda", | |
| "bcp_47": "rw", | |
| "speakers": 11083625, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.14006909985587948, | |
| "chrf": 31.739340000779823 | |
| } | |
| ], | |
| "bleu": 0.14006909985587948, | |
| "chrf": 31.739340000779823, | |
| "commonvoice_hours": 2002.0, | |
| "commonvoice_locale": "rw", | |
| "population": { | |
| "CD": 386764, | |
| "RW": 9788548, | |
| "UG": 908313 | |
| } | |
| }, | |
| { | |
| "language_name": "Wolof", | |
| "bcp_47": "wo", | |
| "speakers": 11025494, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.08408628490585719, | |
| "chrf": 23.767561072306325 | |
| } | |
| ], | |
| "bleu": 0.08408628490585719, | |
| "chrf": 23.767561072306325, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "wo", | |
| "population": { | |
| "MR": 10014, | |
| "SN": 11015480 | |
| } | |
| }, | |
| { | |
| "language_name": "Tunisian Arabic", | |
| "bcp_47": "aeb", | |
| "speakers": 10549080, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23738824104522893, | |
| "chrf": 42.85642541970995 | |
| } | |
| ], | |
| "bleu": 0.23738824104522893, | |
| "chrf": 42.85642541970995, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "TN": 10549080 | |
| } | |
| }, | |
| { | |
| "language_name": "Iloko", | |
| "bcp_47": "ilo", | |
| "speakers": 10481376, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.20685666710862224, | |
| "chrf": 37.066073786659494 | |
| } | |
| ], | |
| "bleu": 0.20685666710862224, | |
| "chrf": 37.066073786659494, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "PH": 10481376 | |
| } | |
| }, | |
| { | |
| "language_name": "Xhosa", | |
| "bcp_47": "xh", | |
| "speakers": 10182944, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1143143326923908, | |
| "chrf": 28.93119601652647 | |
| } | |
| ], | |
| "bleu": 0.1143143326923908, | |
| "chrf": 28.93119601652647, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "xh", | |
| "population": { | |
| "LS": 19496, | |
| "ZA": 10163448 | |
| } | |
| }, | |
| { | |
| "language_name": "Tigrinya", | |
| "bcp_47": "ti", | |
| "speakers": 10145911, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.08532345270447181, | |
| "chrf": 25.148121650983146 | |
| } | |
| ], | |
| "bleu": 0.08532345270447181, | |
| "chrf": 25.148121650983146, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ti", | |
| "population": { | |
| "ER": 3648720, | |
| "ET": 6486780, | |
| "IL": 10411 | |
| } | |
| }, | |
| { | |
| "language_name": "Belarusian", | |
| "bcp_47": "be", | |
| "speakers": 10064517, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.18341973561481445, | |
| "chrf": 39.828398360117035 | |
| } | |
| ], | |
| "bleu": 0.18341973561481445, | |
| "chrf": 39.828398360117035, | |
| "commonvoice_hours": 1804.0, | |
| "commonvoice_locale": "be", | |
| "population": { | |
| "BY": 9477920, | |
| "PL": 222037, | |
| "UA": 364560 | |
| } | |
| }, | |
| { | |
| "language_name": "Luba-Lulua", | |
| "bcp_47": "lua", | |
| "speakers": 9770880, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.11581604983636683, | |
| "chrf": 28.08252510561598 | |
| } | |
| ], | |
| "bleu": 0.11581604983636683, | |
| "chrf": 28.08252510561598, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "CD": 9770880 | |
| } | |
| }, | |
| { | |
| "language_name": "Tajik", | |
| "bcp_47": "tg", | |
| "speakers": 9644223, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1846236171638531, | |
| "chrf": 39.50004300248175 | |
| } | |
| ], | |
| "bleu": 0.1846236171638531, | |
| "chrf": 39.50004300248175, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "tg", | |
| "population": { | |
| "PK": 770553, | |
| "TJ": 8873670 | |
| } | |
| }, | |
| { | |
| "language_name": "Umbundu", | |
| "bcp_47": "umb", | |
| "speakers": 9431467, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.05520341910203098, | |
| "chrf": 20.443280736080066 | |
| } | |
| ], | |
| "bleu": 0.05520341910203098, | |
| "chrf": 20.443280736080066, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "AO": 9431467 | |
| } | |
| }, | |
| { | |
| "language_name": "Bambara", | |
| "bcp_47": "bm", | |
| "speakers": 9385632, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.07227674667013836, | |
| "chrf": 22.136582910055218 | |
| } | |
| ], | |
| "bleu": 0.07227674667013836, | |
| "chrf": 22.136582910055218, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "bm", | |
| "population": { | |
| "ML": 9385632 | |
| } | |
| }, | |
| { | |
| "language_name": "Afrikaans", | |
| "bcp_47": "af", | |
| "speakers": 9318845, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.3277177864074156, | |
| "chrf": 48.61873150516328 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.31538459755111, | |
| "chrf": 47.75260784921264 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.26710030799119333, | |
| "chrf": 38.869810330084285 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.4361740814378139, | |
| "chrf": 56.524736028951835 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.37149647257024515, | |
| "chrf": 53.20003536968165 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.2883662842075808, | |
| "chrf": 45.203083386764426 | |
| } | |
| ], | |
| "bleu": 0.3343732550275598, | |
| "chrf": 48.361500744976354, | |
| "commonvoice_hours": 0.5, | |
| "commonvoice_locale": "af", | |
| "population": { | |
| "BW": 6025, | |
| "NA": 1972552, | |
| "ZA": 7340268 | |
| } | |
| }, | |
| { | |
| "language_name": "Kikuyu", | |
| "bcp_47": "ki", | |
| "speakers": 9099743, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.0883556207236924, | |
| "chrf": 24.868277910094278 | |
| } | |
| ], | |
| "bleu": 0.0883556207236924, | |
| "chrf": 24.868277910094278, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ki", | |
| "population": { | |
| "KE": 9099743 | |
| } | |
| }, | |
| { | |
| "language_name": "Haitian Creole", | |
| "bcp_47": "ht", | |
| "speakers": 8964918, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1872609836464467, | |
| "chrf": 37.00166091804026 | |
| } | |
| ], | |
| "bleu": 0.1872609836464467, | |
| "chrf": 37.00166091804026, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ht", | |
| "population": { | |
| "HT": 8964918 | |
| } | |
| }, | |
| { | |
| "language_name": "Catalan", | |
| "bcp_47": "ca", | |
| "speakers": 8679139, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.29445274007068095, | |
| "chrf": 47.46074814103581 | |
| } | |
| ], | |
| "bleu": 0.29445274007068095, | |
| "chrf": 47.46074814103581, | |
| "commonvoice_hours": 2842.0, | |
| "commonvoice_locale": "ca", | |
| "population": { | |
| "AD": 39270, | |
| "ES": 8502686, | |
| "FR": 115342, | |
| "IT": 21841 | |
| } | |
| }, | |
| { | |
| "language_name": "Hebrew", | |
| "bcp_47": "he", | |
| "speakers": 8675480, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2824719214447976, | |
| "chrf": 46.279771845770604 | |
| } | |
| ], | |
| "bleu": 0.2824719214447976, | |
| "chrf": 46.279771845770604, | |
| "commonvoice_hours": 1.1, | |
| "commonvoice_locale": "he", | |
| "population": { | |
| "IL": 8675480 | |
| } | |
| }, | |
| { | |
| "language_name": "Mossi", | |
| "bcp_47": "mos", | |
| "speakers": 8334160, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.08102496244147746, | |
| "chrf": 22.184797797745208 | |
| } | |
| ], | |
| "bleu": 0.08102496244147746, | |
| "chrf": 22.184797797745208, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "mos", | |
| "population": { | |
| "BF": 8334160 | |
| } | |
| }, | |
| { | |
| "language_name": "Kimbundu", | |
| "bcp_47": "kmb", | |
| "speakers": 8130575, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.07329500673809967, | |
| "chrf": 22.838222030254723 | |
| } | |
| ], | |
| "bleu": 0.07329500673809967, | |
| "chrf": 22.838222030254723, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "AO": 8130575 | |
| } | |
| }, | |
| { | |
| "language_name": "Uyghur", | |
| "bcp_47": "ug", | |
| "speakers": 8052967, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.18397910035998616, | |
| "chrf": 35.50154017198535 | |
| } | |
| ], | |
| "bleu": 0.18397910035998616, | |
| "chrf": 35.50154017198535, | |
| "commonvoice_hours": 361.0, | |
| "commonvoice_locale": "ug", | |
| "population": { | |
| "AF": 3005, | |
| "CN": 7667110, | |
| "KZ": 381838, | |
| "MN": 1014 | |
| } | |
| }, | |
| { | |
| "language_name": "Minangkabau", | |
| "bcp_47": "min", | |
| "speakers": 8010780, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.22401269807719826, | |
| "chrf": 40.34678123737912 | |
| } | |
| ], | |
| "bleu": 0.22401269807719826, | |
| "chrf": 40.34678123737912, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "ID": 8010780 | |
| } | |
| }, | |
| { | |
| "language_name": "Bulgarian", | |
| "bcp_47": "bg", | |
| "speakers": 7878315, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.24723779163445408, | |
| "chrf": 45.55403997487483 | |
| } | |
| ], | |
| "bleu": 0.24723779163445408, | |
| "chrf": 45.55403997487483, | |
| "commonvoice_hours": 16.0, | |
| "commonvoice_locale": "bg", | |
| "population": { | |
| "BG": 6966900, | |
| "GR": 28639, | |
| "MD": 316263, | |
| "RO": 6817, | |
| "TR": 344474, | |
| "UA": 215222 | |
| } | |
| }, | |
| { | |
| "language_name": "Standard Moroccan Tamazight", | |
| "bcp_47": "zgh", | |
| "speakers": 7823574, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.0366272802298245, | |
| "chrf": 15.463910171449278 | |
| } | |
| ], | |
| "bleu": 0.0366272802298245, | |
| "chrf": 15.463910171449278, | |
| "commonvoice_hours": 1.3, | |
| "commonvoice_locale": "zgh", | |
| "population": { | |
| "MA": 7823574 | |
| } | |
| }, | |
| { | |
| "language_name": "Bosnian", | |
| "bcp_47": "bs", | |
| "speakers": 7594468, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3051247921441283, | |
| "chrf": 48.3731481201238 | |
| } | |
| ], | |
| "bleu": 0.3051247921441283, | |
| "chrf": 48.3731481201238, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "bs", | |
| "population": { | |
| "BA": 7594468 | |
| } | |
| }, | |
| { | |
| "language_name": "Rundi", | |
| "bcp_47": "rn", | |
| "speakers": 7475454, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.0957054530624, | |
| "chrf": 28.269164219007447 | |
| } | |
| ], | |
| "bleu": 0.0957054530624, | |
| "chrf": 28.269164219007447, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "BI": 7475454 | |
| } | |
| }, | |
| { | |
| "language_name": "Santali", | |
| "bcp_47": "sat", | |
| "speakers": 7293495, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.11554870024021023, | |
| "chrf": 29.549934477174254 | |
| } | |
| ], | |
| "bleu": 0.11554870024021023, | |
| "chrf": 29.549934477174254, | |
| "commonvoice_hours": 0.5, | |
| "commonvoice_locale": "sat", | |
| "population": { | |
| "IN": 7293495 | |
| } | |
| }, | |
| { | |
| "language_name": "Danish", | |
| "bcp_47": "da", | |
| "speakers": 7072056, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3512857581168584, | |
| "chrf": 51.12453594191334 | |
| } | |
| ], | |
| "bleu": 0.3512857581168584, | |
| "chrf": 51.12453594191334, | |
| "commonvoice_hours": 13.0, | |
| "commonvoice_locale": "da", | |
| "population": { | |
| "DE": 1603194, | |
| "DK": 5458551, | |
| "GL": 8066, | |
| "IS": 2245 | |
| } | |
| }, | |
| { | |
| "language_name": "Turkmen", | |
| "bcp_47": "tk", | |
| "speakers": 6870838, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.15410064596625964, | |
| "chrf": 36.3602620147462 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.14820890318014426, | |
| "chrf": 34.78567738931005 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.07938993687949465, | |
| "chrf": 24.385063397578556 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.2761834512123037, | |
| "chrf": 47.41646574422384 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.1718597543270264, | |
| "chrf": 38.84762953076257 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.10118596975980092, | |
| "chrf": 28.31840639855478 | |
| } | |
| ], | |
| "bleu": 0.15515477688750492, | |
| "chrf": 35.018917412529326, | |
| "commonvoice_hours": 2.8, | |
| "commonvoice_locale": "tk", | |
| "population": { | |
| "AF": 622945, | |
| "IR": 2377852, | |
| "TM": 3870041 | |
| } | |
| }, | |
| { | |
| "language_name": "Kurdish", | |
| "bcp_47": "ku", | |
| "speakers": 6866757, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.14440915289810186, | |
| "chrf": 31.3622869278075 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.15987085387022903, | |
| "chrf": 35.18523232721762 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.10987778830152085, | |
| "chrf": 25.91454653951599 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.28985769410441137, | |
| "chrf": 46.64309582634758 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.1865343501300658, | |
| "chrf": 37.28483871763787 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.10000019378200214, | |
| "chrf": 26.406217887319293 | |
| } | |
| ], | |
| "bleu": 0.16509167218105517, | |
| "chrf": 33.79936970430764, | |
| "commonvoice_hours": 69.0, | |
| "commonvoice_locale": "kmr", | |
| "population": { | |
| "AM": 99704, | |
| "AZ": 24494, | |
| "DE": 529054, | |
| "GE": 35573, | |
| "LB": 92983, | |
| "SY": 1551872, | |
| "TM": 22115, | |
| "TR": 4510962 | |
| } | |
| }, | |
| { | |
| "language_name": "Croatian", | |
| "bcp_47": "hr", | |
| "speakers": 6813164, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2290484937313612, | |
| "chrf": 41.79307139114272 | |
| } | |
| ], | |
| "bleu": 0.2290484937313612, | |
| "chrf": 41.79307139114272, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "hr", | |
| "population": { | |
| "AT": 106313, | |
| "BA": 460271, | |
| "CA": 45233, | |
| "DE": 633262, | |
| "HR": 4185472, | |
| "HU": 31270, | |
| "IT": 3495, | |
| "RS": 65213, | |
| "SI": 1282635 | |
| } | |
| }, | |
| { | |
| "language_name": "Albanian", | |
| "bcp_47": "sq", | |
| "speakers": 6791906, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.26490711574268994, | |
| "chrf": 44.54318851690701 | |
| } | |
| ], | |
| "bleu": 0.26490711574268994, | |
| "chrf": 44.54318851690701, | |
| "commonvoice_hours": 8.8, | |
| "commonvoice_locale": "sq", | |
| "population": { | |
| "AL": 3074580, | |
| "GR": 9971, | |
| "ME": 48179, | |
| "MK": 531492, | |
| "RS": 1332312, | |
| "TR": 17224, | |
| "XK": 1778148 | |
| } | |
| }, | |
| { | |
| "language_name": "Slovak", | |
| "bcp_47": "sk", | |
| "speakers": 6680269, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2826836020834733, | |
| "chrf": 45.73110764547564 | |
| } | |
| ], | |
| "bleu": 0.2826836020834733, | |
| "chrf": 45.73110764547564, | |
| "commonvoice_hours": 40.0, | |
| "commonvoice_locale": "sk", | |
| "population": { | |
| "CZ": 1712400, | |
| "HU": 11726, | |
| "RS": 59603, | |
| "SK": 4896540 | |
| } | |
| }, | |
| { | |
| "language_name": "Dyula", | |
| "bcp_47": "dyu", | |
| "speakers": 6667328, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.0633017924291756, | |
| "chrf": 21.71247042480193 | |
| } | |
| ], | |
| "bleu": 0.0633017924291756, | |
| "chrf": 21.71247042480193, | |
| "commonvoice_hours": 0.3, | |
| "commonvoice_locale": "dyu", | |
| "population": { | |
| "BF": 6667328 | |
| } | |
| }, | |
| { | |
| "language_name": "Mongolian", | |
| "bcp_47": "mn", | |
| "speakers": 6572846, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1950781841033538, | |
| "chrf": 41.09779803278993 | |
| } | |
| ], | |
| "bleu": 0.1950781841033538, | |
| "chrf": 41.09779803278993, | |
| "commonvoice_hours": 46.0, | |
| "commonvoice_locale": "mn", | |
| "population": { | |
| "CN": 3624452, | |
| "MN": 2946268, | |
| "RU": 2126 | |
| } | |
| }, | |
| { | |
| "language_name": "Southern Sotho", | |
| "bcp_47": "st", | |
| "speakers": 6390567, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.12381413258013083, | |
| "chrf": 28.651371806370722 | |
| } | |
| ], | |
| "bleu": 0.12381413258013083, | |
| "chrf": 28.651371806370722, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "st", | |
| "population": { | |
| "LS": 1929943, | |
| "ZA": 4460624 | |
| } | |
| }, | |
| { | |
| "language_name": "Tswana", | |
| "bcp_47": "tn", | |
| "speakers": 6113428, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.09139131060492443, | |
| "chrf": 25.97258334431281 | |
| } | |
| ], | |
| "bleu": 0.09139131060492443, | |
| "chrf": 25.97258334431281, | |
| "commonvoice_hours": 4.2, | |
| "commonvoice_locale": "tn", | |
| "population": { | |
| "BW": 1436683, | |
| "NA": 14728, | |
| "ZA": 4630015, | |
| "ZW": 32002 | |
| } | |
| }, | |
| { | |
| "language_name": "Guarani", | |
| "bcp_47": "gn", | |
| "speakers": 5827107, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.12296923497272805, | |
| "chrf": 29.040238903610113 | |
| } | |
| ], | |
| "bleu": 0.12296923497272805, | |
| "chrf": 29.040238903610113, | |
| "commonvoice_hours": 3.7, | |
| "commonvoice_locale": "gn", | |
| "population": { | |
| "AR": 21375, | |
| "BO": 52380, | |
| "PY": 5753352 | |
| } | |
| }, | |
| { | |
| "language_name": "Finnish", | |
| "bcp_47": "fi", | |
| "speakers": 5736842, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2306868672081301, | |
| "chrf": 42.094559446408105 | |
| } | |
| ], | |
| "bleu": 0.2306868672081301, | |
| "chrf": 42.094559446408105, | |
| "commonvoice_hours": 15.0, | |
| "commonvoice_locale": "fi", | |
| "population": { | |
| "EE": 258010, | |
| "FI": 5237370, | |
| "RU": 17007, | |
| "SE": 224455 | |
| } | |
| }, | |
| { | |
| "language_name": "Ganda", | |
| "bcp_47": "lg", | |
| "speakers": 5622890, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.09865217050437662, | |
| "chrf": 25.926064361947446 | |
| } | |
| ], | |
| "bleu": 0.09865217050437662, | |
| "chrf": 25.926064361947446, | |
| "commonvoice_hours": 437.0, | |
| "commonvoice_locale": "lg", | |
| "population": { | |
| "UG": 5622890 | |
| } | |
| }, | |
| { | |
| "language_name": "Kashmiri", | |
| "bcp_47": "ks", | |
| "speakers": 5598085, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1344939664526747, | |
| "chrf": 32.68903932403509 | |
| } | |
| ], | |
| "bleu": 0.1344939664526747, | |
| "chrf": 32.68903932403509, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 5436969, | |
| "PK": 161116 | |
| } | |
| }, | |
| { | |
| "language_name": "Norwegian Bokmål", | |
| "bcp_47": "nb", | |
| "speakers": 5468932, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3568538739752233, | |
| "chrf": 50.18863565152686 | |
| } | |
| ], | |
| "bleu": 0.3568538739752233, | |
| "chrf": 50.18863565152686, | |
| "commonvoice_hours": 0.1, | |
| "commonvoice_locale": "nb-NO", | |
| "population": { | |
| "NO": 5467440, | |
| "SJ": 1492 | |
| } | |
| }, | |
| { | |
| "language_name": "Bemba", | |
| "bcp_47": "bem", | |
| "speakers": 5402246, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.07496563614353445, | |
| "chrf": 23.431580504923282 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.10425825663987873, | |
| "chrf": 26.156513526794825 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.048552315311727906, | |
| "chrf": 17.052116746764433 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.20820762589055672, | |
| "chrf": 37.899164894105404 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.13037194233770932, | |
| "chrf": 29.069219847377738 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.07919429950933718, | |
| "chrf": 22.45526755754465 | |
| } | |
| ], | |
| "bleu": 0.10759167930545738, | |
| "chrf": 26.01064384625172, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "ZM": 5402246 | |
| } | |
| }, | |
| { | |
| "language_name": "Armenian", | |
| "bcp_47": "hy", | |
| "speakers": 5317273, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2525113198548088, | |
| "chrf": 44.115149170486895 | |
| } | |
| ], | |
| "bleu": 0.2525113198548088, | |
| "chrf": 44.115149170486895, | |
| "commonvoice_hours": 31.0, | |
| "commonvoice_locale": "hy-AM", | |
| "population": { | |
| "AM": 2960894, | |
| "CY": 2787, | |
| "GE": 279790, | |
| "IR": 203816, | |
| "LB": 284420, | |
| "RU": 1190465, | |
| "SY": 349171, | |
| "TR": 45930 | |
| } | |
| }, | |
| { | |
| "language_name": "Northern Sotho", | |
| "bcp_47": "nso", | |
| "speakers": 5307578, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.1287306186367617, | |
| "chrf": 28.538499437787404 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.11431860079235977, | |
| "chrf": 29.789689541768464 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.048032427671766596, | |
| "chrf": 16.511000736562355 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.277532484522071, | |
| "chrf": 43.725160462861595 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.1559013863573944, | |
| "chrf": 31.344526297642712 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.08683694629684643, | |
| "chrf": 24.176752802670837 | |
| } | |
| ], | |
| "bleu": 0.13522541071286664, | |
| "chrf": 29.014271546548898, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "nso", | |
| "population": { | |
| "ZA": 5307578 | |
| } | |
| }, | |
| { | |
| "language_name": "Luo (Kenya and Tanzania)", | |
| "bcp_47": "luo", | |
| "speakers": 5245734, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.07123028733548639, | |
| "chrf": 21.84956735049654 | |
| } | |
| ], | |
| "bleu": 0.07123028733548639, | |
| "chrf": 21.84956735049654, | |
| "commonvoice_hours": 30.0, | |
| "commonvoice_locale": "luo", | |
| "population": { | |
| "KE": 5245734 | |
| } | |
| }, | |
| { | |
| "language_name": "Tok Pisin", | |
| "bcp_47": "tpi", | |
| "speakers": 5154217, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.17665711931817996, | |
| "chrf": 35.46692292627831 | |
| } | |
| ], | |
| "bleu": 0.17665711931817996, | |
| "chrf": 35.46692292627831, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "PG": 5154217 | |
| } | |
| }, | |
| { | |
| "language_name": "Lao", | |
| "bcp_47": "lo", | |
| "speakers": 5138706, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.17291556794348653, | |
| "chrf": 35.37210957380201 | |
| } | |
| ], | |
| "bleu": 0.17291556794348653, | |
| "chrf": 35.37210957380201, | |
| "commonvoice_hours": 0.2, | |
| "commonvoice_locale": "lo", | |
| "population": { | |
| "LA": 5138706 | |
| } | |
| }, | |
| { | |
| "language_name": "Tsonga", | |
| "bcp_47": "ts", | |
| "speakers": 4880932, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.1264498146181144, | |
| "chrf": 26.535888048377064 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.09614725376527729, | |
| "chrf": 26.35974604226704 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.043920591728788254, | |
| "chrf": 15.171343812958735 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.2843690426617385, | |
| "chrf": 43.51952547276378 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.10072669531344912, | |
| "chrf": 24.778318092682298 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.0708900783780892, | |
| "chrf": 24.114324582460767 | |
| } | |
| ], | |
| "bleu": 0.12041724607757613, | |
| "chrf": 26.746524341918285, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ts", | |
| "population": { | |
| "MZ": 2377758, | |
| "SZ": 18776, | |
| "ZA": 2484398 | |
| } | |
| }, | |
| { | |
| "language_name": "Balinese", | |
| "bcp_47": "ban", | |
| "speakers": 4806468, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.20937766416587725, | |
| "chrf": 37.802202729584685 | |
| } | |
| ], | |
| "bleu": 0.20937766416587725, | |
| "chrf": 37.802202729584685, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "ID": 4806468 | |
| } | |
| }, | |
| { | |
| "language_name": "Ewe", | |
| "bcp_47": "ee", | |
| "speakers": 4690857, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.06328122760447334, | |
| "chrf": 21.930232101484705 | |
| } | |
| ], | |
| "bleu": 0.06328122760447334, | |
| "chrf": 21.930232101484705, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ee", | |
| "population": { | |
| "GH": 3227422, | |
| "TG": 1463435 | |
| } | |
| }, | |
| { | |
| "language_name": "Buginese", | |
| "bcp_47": "bug", | |
| "speakers": 4298211, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.11888625287150432, | |
| "chrf": 26.566035803697112 | |
| } | |
| ], | |
| "bleu": 0.11888625287150432, | |
| "chrf": 26.566035803697112, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "ID": 4272416, | |
| "MY": 25795 | |
| } | |
| }, | |
| { | |
| "language_name": "Goan Konkani", | |
| "bcp_47": "gom", | |
| "speakers": 4243488, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.17517997036818814, | |
| "chrf": 35.662782661637515 | |
| } | |
| ], | |
| "bleu": 0.17517997036818814, | |
| "chrf": 35.662782661637515, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "gom", | |
| "population": { | |
| "IN": 4243488 | |
| } | |
| }, | |
| { | |
| "language_name": "Kamba", | |
| "bcp_47": "kam", | |
| "speakers": 4068120, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.09766297423802607, | |
| "chrf": 24.328994687372596 | |
| } | |
| ], | |
| "bleu": 0.09766297423802607, | |
| "chrf": 24.328994687372596, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "KE": 4068120 | |
| } | |
| }, | |
| { | |
| "language_name": "Banjar", | |
| "bcp_47": "bjn", | |
| "speakers": 4010288, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21429523594040997, | |
| "chrf": 37.997802850700054 | |
| } | |
| ], | |
| "bleu": 0.21429523594040997, | |
| "chrf": 37.997802850700054, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "ID": 4005390, | |
| "MY": 4898 | |
| } | |
| }, | |
| { | |
| "language_name": "Lombard", | |
| "bcp_47": "lmo", | |
| "speakers": 3901518, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.19986098660959015, | |
| "chrf": 38.27348032712485 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21159778572935684, | |
| "chrf": 40.44461475492081 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.1588300738463149, | |
| "chrf": 31.614789846388156 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.30563834118855027, | |
| "chrf": 47.111364119506355 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.22666325208418955, | |
| "chrf": 42.07703156302399 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.18882590620933629, | |
| "chrf": 37.12550972377164 | |
| } | |
| ], | |
| "bleu": 0.215236057611223, | |
| "chrf": 39.44113172245597, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "CH": 344564, | |
| "IT": 3556954 | |
| } | |
| }, | |
| { | |
| "language_name": "Achinese", | |
| "bcp_47": "ace", | |
| "speakers": 3738364, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.16911632683538352, | |
| "chrf": 35.055560798896856 | |
| } | |
| ], | |
| "bleu": 0.16911632683538352, | |
| "chrf": 35.055560798896856, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ace", | |
| "population": { | |
| "ID": 3738364 | |
| } | |
| }, | |
| { | |
| "language_name": "Shan", | |
| "bcp_47": "shn", | |
| "speakers": 3687984, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.03567194702202585, | |
| "chrf": 15.061253284595894 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.14589621017705648, | |
| "chrf": 32.36640913542123 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.011114664716630177, | |
| "chrf": 9.54345606166579 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.24688742301342204, | |
| "chrf": 43.47153430068834 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.11534595629433392, | |
| "chrf": 32.685789872044445 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.06564720827517354, | |
| "chrf": 21.409820368208937 | |
| } | |
| ], | |
| "bleu": 0.10342723491644035, | |
| "chrf": 25.756377170437435, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "shn", | |
| "population": { | |
| "MM": 3621766, | |
| "TH": 66218 | |
| } | |
| }, | |
| { | |
| "language_name": "Georgian", | |
| "bcp_47": "ka", | |
| "speakers": 3543646, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.22489436376782782, | |
| "chrf": 42.05355918136569 | |
| } | |
| ], | |
| "bleu": 0.22489436376782782, | |
| "chrf": 42.05355918136569, | |
| "commonvoice_hours": 158.0, | |
| "commonvoice_locale": "ka", | |
| "population": { | |
| "GE": 3437420, | |
| "IR": 60296, | |
| "TR": 45930 | |
| } | |
| }, | |
| { | |
| "language_name": "Galician", | |
| "bcp_47": "gl", | |
| "speakers": 3515530, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2463790593991139, | |
| "chrf": 43.16984633200989 | |
| } | |
| ], | |
| "bleu": 0.2463790593991139, | |
| "chrf": 43.16984633200989, | |
| "commonvoice_hours": 109.0, | |
| "commonvoice_locale": "gl", | |
| "population": { | |
| "ES": 3501106, | |
| "PT": 14424 | |
| } | |
| }, | |
| { | |
| "language_name": "Lingala", | |
| "bcp_47": "ln", | |
| "speakers": 3514491, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.10115588577551943, | |
| "chrf": 26.041173534129616 | |
| } | |
| ], | |
| "bleu": 0.10115588577551943, | |
| "chrf": 26.041173534129616, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ln", | |
| "population": { | |
| "AO": 217899, | |
| "CD": 3155180, | |
| "CF": 14378, | |
| "CG": 127034 | |
| } | |
| }, | |
| { | |
| "language_name": "Kabyle", | |
| "bcp_47": "kab", | |
| "speakers": 3351886, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.03368838568519845, | |
| "chrf": 17.84430440143716 | |
| } | |
| ], | |
| "bleu": 0.03368838568519845, | |
| "chrf": 17.84430440143716, | |
| "commonvoice_hours": 571.0, | |
| "commonvoice_locale": "kab", | |
| "population": { | |
| "DZ": 3351886 | |
| } | |
| }, | |
| { | |
| "language_name": "Kyrgyz", | |
| "bcp_47": "ky", | |
| "speakers": 3338267, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21002212869070494, | |
| "chrf": 39.3726736717899 | |
| } | |
| ], | |
| "bleu": 0.21002212869070494, | |
| "chrf": 39.3726736717899, | |
| "commonvoice_hours": 39.0, | |
| "commonvoice_locale": "ky", | |
| "population": { | |
| "CN": 473967, | |
| "KG": 2863152, | |
| "TR": 1148 | |
| } | |
| }, | |
| { | |
| "language_name": "Fon", | |
| "bcp_47": "fon", | |
| "speakers": 3216150, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.0832678269022026, | |
| "chrf": 21.627442109362057 | |
| } | |
| ], | |
| "bleu": 0.0832678269022026, | |
| "chrf": 21.627442109362057, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "BJ": 3216150 | |
| } | |
| }, | |
| { | |
| "language_name": "Waray", | |
| "bcp_47": "war", | |
| "speakers": 3166927, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2156899984074879, | |
| "chrf": 38.73293471051519 | |
| } | |
| ], | |
| "bleu": 0.2156899984074879, | |
| "chrf": 38.73293471051519, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "CA": 678, | |
| "PH": 3166249 | |
| } | |
| }, | |
| { | |
| "language_name": "Tibetan", | |
| "bcp_47": "bo", | |
| "speakers": 3006697, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.11883469874802492, | |
| "chrf": 29.188000714511094 | |
| } | |
| ], | |
| "bleu": 0.11883469874802492, | |
| "chrf": 29.188000714511094, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "bo", | |
| "population": { | |
| "CN": 2788040, | |
| "IN": 145870, | |
| "NP": 72787 | |
| } | |
| }, | |
| { | |
| "language_name": "Sango", | |
| "bcp_47": "sg", | |
| "speakers": 2935521, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.052708457503892185, | |
| "chrf": 21.077342933150366 | |
| } | |
| ], | |
| "bleu": 0.052708457503892185, | |
| "chrf": 21.077342933150366, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "CF": 2935521 | |
| } | |
| }, | |
| { | |
| "language_name": "Aymara", | |
| "bcp_47": "ay", | |
| "speakers": 2838620, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.07563412710891973, | |
| "chrf": 23.042901816075858 | |
| } | |
| ], | |
| "bleu": 0.07563412710891973, | |
| "chrf": 23.042901816075858, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "BO": 2327980, | |
| "PE": 510640 | |
| } | |
| }, | |
| { | |
| "language_name": "Dogri", | |
| "bcp_47": "doi", | |
| "speakers": 2652180, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.18698274115592, | |
| "chrf": 36.17811444987121 | |
| } | |
| ], | |
| "bleu": 0.18698274115592, | |
| "chrf": 36.17811444987121, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 2652180 | |
| } | |
| }, | |
| { | |
| "language_name": "Lithuanian", | |
| "bcp_47": "lt", | |
| "speakers": 2488617, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23629191535308328, | |
| "chrf": 41.457632804056466 | |
| } | |
| ], | |
| "bleu": 0.23629191535308328, | |
| "chrf": 41.457632804056466, | |
| "commonvoice_hours": 25.0, | |
| "commonvoice_locale": "lt", | |
| "population": { | |
| "GB": 131522, | |
| "LT": 2349056, | |
| "PL": 8039 | |
| } | |
| }, | |
| { | |
| "language_name": "Swati", | |
| "bcp_47": "ss", | |
| "speakers": 2212379, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.10571792263190831, | |
| "chrf": 26.72182646364123 | |
| } | |
| ], | |
| "bleu": 0.10571792263190831, | |
| "chrf": 26.72182646364123, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "ss", | |
| "population": { | |
| "LS": 47264, | |
| "SZ": 640598, | |
| "ZA": 1524517 | |
| } | |
| }, | |
| { | |
| "language_name": "Occitan", | |
| "bcp_47": "oc", | |
| "speakers": 2040398, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3116700967049491, | |
| "chrf": 49.33859359679982 | |
| } | |
| ], | |
| "bleu": 0.3116700967049491, | |
| "chrf": 49.33859359679982, | |
| "commonvoice_hours": 1.8, | |
| "commonvoice_locale": "oc", | |
| "population": { | |
| "ES": 4952, | |
| "FR": 2035446 | |
| } | |
| }, | |
| { | |
| "language_name": "Tatar", | |
| "bcp_47": "tt", | |
| "speakers": 1984108, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.20199966692246552, | |
| "chrf": 38.969447814905855 | |
| } | |
| ], | |
| "bleu": 0.20199966692246552, | |
| "chrf": 38.969447814905855, | |
| "commonvoice_hours": 32.0, | |
| "commonvoice_locale": "tt", | |
| "population": { | |
| "RU": 1984108 | |
| } | |
| }, | |
| { | |
| "language_name": "Slovenian", | |
| "bcp_47": "sl", | |
| "speakers": 1973181, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.25710751649810404, | |
| "chrf": 43.97419502631293 | |
| } | |
| ], | |
| "bleu": 0.25710751649810404, | |
| "chrf": 43.97419502631293, | |
| "commonvoice_hours": 17.0, | |
| "commonvoice_locale": "sl", | |
| "population": { | |
| "AT": 32780, | |
| "HU": 4984, | |
| "IT": 106085, | |
| "SI": 1829332 | |
| } | |
| }, | |
| { | |
| "language_name": "Bodo", | |
| "bcp_47": "brx", | |
| "speakers": 1856526, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.07193315161893905, | |
| "chrf": 21.198050861825372 | |
| } | |
| ], | |
| "bleu": 0.07193315161893905, | |
| "chrf": 21.198050861825372, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 1856526 | |
| } | |
| }, | |
| { | |
| "language_name": "Chuvash", | |
| "bcp_47": "cv", | |
| "speakers": 1842386, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.16319209573807847, | |
| "chrf": 35.5605244185656 | |
| } | |
| ], | |
| "bleu": 0.16319209573807847, | |
| "chrf": 35.5605244185656, | |
| "commonvoice_hours": 27.0, | |
| "commonvoice_locale": "cv", | |
| "population": { | |
| "RU": 1842386 | |
| } | |
| }, | |
| { | |
| "language_name": "Bashkir", | |
| "bcp_47": "ba", | |
| "speakers": 1842386, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23494956875272427, | |
| "chrf": 43.58361096793536 | |
| } | |
| ], | |
| "bleu": 0.23494956875272427, | |
| "chrf": 43.58361096793536, | |
| "commonvoice_hours": 259.0, | |
| "commonvoice_locale": "ba", | |
| "population": { | |
| "RU": 1842386 | |
| } | |
| }, | |
| { | |
| "language_name": "Tumbuka", | |
| "bcp_47": "tum", | |
| "speakers": 1780514, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.09211959148198216, | |
| "chrf": 25.078974624106454 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.08953119623294435, | |
| "chrf": 26.60406076382521 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.036353192983993324, | |
| "chrf": 15.247949668242475 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.21852974820220555, | |
| "chrf": 40.790711915222424 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.13308678184347988, | |
| "chrf": 31.89595169117875 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.06252197708878435, | |
| "chrf": 23.417269345311365 | |
| } | |
| ], | |
| "bleu": 0.10535708130556494, | |
| "chrf": 27.172486334647783, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "MW": 1780514 | |
| } | |
| }, | |
| { | |
| "language_name": "Macedonian", | |
| "bcp_47": "mk", | |
| "speakers": 1608565, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2635416107541368, | |
| "chrf": 46.15461303306508 | |
| } | |
| ], | |
| "bleu": 0.2635416107541368, | |
| "chrf": 46.15461303306508, | |
| "commonvoice_hours": 18.0, | |
| "commonvoice_locale": "mk", | |
| "population": { | |
| "AL": 14451, | |
| "GR": 169714, | |
| "MK": 1424400 | |
| } | |
| }, | |
| { | |
| "language_name": "Pangasinan", | |
| "bcp_47": "pag", | |
| "speakers": 1528534, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.14637588345836686, | |
| "chrf": 33.27328635596556 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.17061619096272593, | |
| "chrf": 35.63408741214199 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.11313843155080379, | |
| "chrf": 26.507505375137484 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.27369890360254523, | |
| "chrf": 44.34141738332121 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.19116528491340065, | |
| "chrf": 36.672507303893106 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.11054650956119119, | |
| "chrf": 30.67803234997905 | |
| } | |
| ], | |
| "bleu": 0.16759020067483896, | |
| "chrf": 34.51780603007307, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "PH": 1528534 | |
| } | |
| }, | |
| { | |
| "language_name": "Manipuri", | |
| "bcp_47": "mni", | |
| "speakers": 1476591, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.061702153982680315, | |
| "chrf": 20.627265799751633 | |
| } | |
| ], | |
| "bleu": 0.061702153982680315, | |
| "chrf": 20.627265799751633, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "mni", | |
| "population": { | |
| "BD": 17892, | |
| "IN": 1458699 | |
| } | |
| }, | |
| { | |
| "language_name": "Venetian", | |
| "bcp_47": "vec", | |
| "speakers": 1380829, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.24764447442173138, | |
| "chrf": 41.97335861313842 | |
| } | |
| ], | |
| "bleu": 0.24764447442173138, | |
| "chrf": 41.97335861313842, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "vec", | |
| "population": { | |
| "BR": 508118, | |
| "HR": 29594, | |
| "IT": 811235, | |
| "MX": 2444, | |
| "SI": 29438 | |
| } | |
| }, | |
| { | |
| "language_name": "Norwegian Nynorsk", | |
| "bcp_47": "nn", | |
| "speakers": 1366860, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.31661912673403325, | |
| "chrf": 48.792392911852595 | |
| } | |
| ], | |
| "bleu": 0.31661912673403325, | |
| "chrf": 48.792392911852595, | |
| "commonvoice_hours": 1.5, | |
| "commonvoice_locale": "nn-NO", | |
| "population": { | |
| "NO": 1366860 | |
| } | |
| }, | |
| { | |
| "language_name": "Irish", | |
| "bcp_47": "ga", | |
| "speakers": 1237487, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2768559181644857, | |
| "chrf": 46.47151564403362 | |
| } | |
| ], | |
| "bleu": 0.2768559181644857, | |
| "chrf": 46.47151564403362, | |
| "commonvoice_hours": 5.8, | |
| "commonvoice_locale": "ga-IE", | |
| "population": { | |
| "GB": 98642, | |
| "IE": 1138845 | |
| } | |
| }, | |
| { | |
| "language_name": "Latvian", | |
| "bcp_47": "lv", | |
| "speakers": 1147550, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23200427142275887, | |
| "chrf": 44.00679383253316 | |
| } | |
| ], | |
| "bleu": 0.23200427142275887, | |
| "chrf": 44.00679383253316, | |
| "commonvoice_hours": 260.0, | |
| "commonvoice_locale": "lv", | |
| "population": { | |
| "LV": 1147550 | |
| } | |
| }, | |
| { | |
| "language_name": "Basque", | |
| "bcp_47": "eu", | |
| "speakers": 1088519, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1907277513380933, | |
| "chrf": 40.633564870804214 | |
| } | |
| ], | |
| "bleu": 0.1907277513380933, | |
| "chrf": 40.633564870804214, | |
| "commonvoice_hours": 335.0, | |
| "commonvoice_locale": "eu", | |
| "population": { | |
| "ES": 1000316, | |
| "FR": 88203 | |
| } | |
| }, | |
| { | |
| "language_name": "Sardinian", | |
| "bcp_47": "sc", | |
| "speakers": 1060846, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2003666163856343, | |
| "chrf": 39.97859549386356 | |
| } | |
| ], | |
| "bleu": 0.2003666163856343, | |
| "chrf": 39.97859549386356, | |
| "commonvoice_hours": 2.9, | |
| "commonvoice_locale": "sc", | |
| "population": { | |
| "IT": 1060846 | |
| } | |
| }, | |
| { | |
| "language_name": "Najdi Arabic", | |
| "bcp_47": "ars", | |
| "speakers": 1025205, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.26325866988203733, | |
| "chrf": 45.79452460253912 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.25411630061861235, | |
| "chrf": 45.68081123321704 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.19634428413472024, | |
| "chrf": 37.402576382999925 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3267312117229826, | |
| "chrf": 50.07524798517934 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.27947088689796734, | |
| "chrf": 47.70370329275568 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.23043700347741075, | |
| "chrf": 40.64509062227617 | |
| } | |
| ], | |
| "bleu": 0.2583930594556218, | |
| "chrf": 44.550325686494546, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "SA": 1025205 | |
| } | |
| }, | |
| { | |
| "language_name": "Yiddish", | |
| "bcp_47": "yi", | |
| "speakers": 997214, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2748989006328114, | |
| "chrf": 44.151717001541904 | |
| } | |
| ], | |
| "bleu": 0.2748989006328114, | |
| "chrf": 44.151717001541904, | |
| "commonvoice_hours": 0.5, | |
| "commonvoice_locale": "yi", | |
| "population": { | |
| "IL": 260264, | |
| "SE": 2959, | |
| "UA": 570998, | |
| "US": 162993 | |
| } | |
| }, | |
| { | |
| "language_name": "Kachin", | |
| "bcp_47": "kac", | |
| "speakers": 962032, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.06343642810657522, | |
| "chrf": 21.96116119019238 | |
| } | |
| ], | |
| "bleu": 0.06343642810657522, | |
| "chrf": 21.96116119019238, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "MM": 962032 | |
| } | |
| }, | |
| { | |
| "language_name": "Limburgish", | |
| "bcp_47": "li", | |
| "speakers": 950422, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.28017358847160223, | |
| "chrf": 45.82764538788154 | |
| } | |
| ], | |
| "bleu": 0.28017358847160223, | |
| "chrf": 45.82764538788154, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "NL": 950422 | |
| } | |
| }, | |
| { | |
| "language_name": "Welsh", | |
| "bcp_47": "cy", | |
| "speakers": 884910, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.31667961925197524, | |
| "chrf": 48.49344578612579 | |
| } | |
| ], | |
| "bleu": 0.31667961925197524, | |
| "chrf": 48.49344578612579, | |
| "commonvoice_hours": 124.0, | |
| "commonvoice_locale": "cy", | |
| "population": { | |
| "AR": 30016, | |
| "GB": 854894 | |
| } | |
| }, | |
| { | |
| "language_name": "Estonian", | |
| "bcp_47": "et", | |
| "speakers": 878449, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.23762161272302187, | |
| "chrf": 42.90409268311042 | |
| } | |
| ], | |
| "bleu": 0.23762161272302187, | |
| "chrf": 42.90409268311042, | |
| "commonvoice_hours": 58.0, | |
| "commonvoice_locale": "et", | |
| "population": { | |
| "EE": 872320, | |
| "FI": 6129 | |
| } | |
| }, | |
| { | |
| "language_name": "Asturian", | |
| "bcp_47": "ast", | |
| "speakers": 650205, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.3066166431048003, | |
| "chrf": 47.792858053998366 | |
| } | |
| ], | |
| "bleu": 0.3066166431048003, | |
| "chrf": 47.792858053998366, | |
| "commonvoice_hours": 0.7, | |
| "commonvoice_locale": "ast", | |
| "population": { | |
| "ES": 650205 | |
| } | |
| }, | |
| { | |
| "language_name": "N’Ko", | |
| "bcp_47": "nqo", | |
| "speakers": 626370, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.0026829540009563496, | |
| "chrf": 8.366238228343608 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.0028810767141941676, | |
| "chrf": 11.711522538883516 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.002244809403558117, | |
| "chrf": 6.87154254960649 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.1373860974763018, | |
| "chrf": 29.63649387292498 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.005449384832055512, | |
| "chrf": 13.63303465097306 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.001220306675003964, | |
| "chrf": 11.614232149229839 | |
| } | |
| ], | |
| "bleu": 0.02531077151701165, | |
| "chrf": 13.638843998326914, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "nqo", | |
| "population": { | |
| "GN": 626370 | |
| } | |
| }, | |
| { | |
| "language_name": "Nuer", | |
| "bcp_47": "nus", | |
| "speakers": 591427, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.04422064781985695, | |
| "chrf": 18.101658717442856 | |
| } | |
| ], | |
| "bleu": 0.04422064781985695, | |
| "chrf": 18.101658717442856, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "SS": 591427 | |
| } | |
| }, | |
| { | |
| "language_name": "Ligurian", | |
| "bcp_47": "lij", | |
| "speakers": 536663, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.2433180508520944, | |
| "chrf": 42.16628456571689 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2730358021257564, | |
| "chrf": 43.59770121161605 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.1659569541464764, | |
| "chrf": 32.04882604989477 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.3868854055493315, | |
| "chrf": 52.982923067584665 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.30131335750773747, | |
| "chrf": 47.80059076162273 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.22953082347299453, | |
| "chrf": 39.89195612874355 | |
| } | |
| ], | |
| "bleu": 0.26667339894239844, | |
| "chrf": 43.08138029752978, | |
| "commonvoice_hours": 5.1, | |
| "commonvoice_locale": "lij", | |
| "population": { | |
| "IT": 536663 | |
| } | |
| }, | |
| { | |
| "language_name": "Kabuverdianu", | |
| "bcp_47": "kea", | |
| "speakers": 530762, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2049568393036302, | |
| "chrf": 39.12735936405683 | |
| } | |
| ], | |
| "bleu": 0.2049568393036302, | |
| "chrf": 39.12735936405683, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "CV": 530762 | |
| } | |
| }, | |
| { | |
| "language_name": "Mari", | |
| "bcp_47": "chm", | |
| "speakers": 524371, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.1477332953533076, | |
| "chrf": 33.28969144955911 | |
| } | |
| ], | |
| "bleu": 0.1477332953533076, | |
| "chrf": 33.28969144955911, | |
| "commonvoice_hours": 282.0, | |
| "commonvoice_locale": "mhr", | |
| "population": { | |
| "RU": 524371 | |
| } | |
| }, | |
| { | |
| "language_name": "Sicilian", | |
| "bcp_47": "scn", | |
| "speakers": 511702, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.26991391704955275, | |
| "chrf": 44.10988575231252 | |
| } | |
| ], | |
| "bleu": 0.26991391704955275, | |
| "chrf": 44.10988575231252, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "scn", | |
| "population": { | |
| "IT": 511702 | |
| } | |
| }, | |
| { | |
| "language_name": "Silesian", | |
| "bcp_47": "szl", | |
| "speakers": 497670, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2478859256009672, | |
| "chrf": 42.936549641246145 | |
| } | |
| ], | |
| "bleu": 0.2478859256009672, | |
| "chrf": 42.936549641246145, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "PL": 497670 | |
| } | |
| }, | |
| { | |
| "language_name": "Maltese", | |
| "bcp_47": "mt", | |
| "speakers": 457267, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.27335683193570975, | |
| "chrf": 45.920903610737895 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.28654849898846085, | |
| "chrf": 46.936205424540766 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.15248109554681186, | |
| "chrf": 30.516627088468166 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.38954095833662916, | |
| "chrf": 54.945196672005885 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.3175303995061197, | |
| "chrf": 51.04064318379729 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.11179045198515461, | |
| "chrf": 30.191257026189298 | |
| } | |
| ], | |
| "bleu": 0.2552080393831477, | |
| "chrf": 43.25847216762322, | |
| "commonvoice_hours": 8.7, | |
| "commonvoice_locale": "mt", | |
| "population": { | |
| "MT": 457267 | |
| } | |
| }, | |
| { | |
| "language_name": "Luxembourgish", | |
| "bcp_47": "lb", | |
| "speakers": 421015, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2835765541228824, | |
| "chrf": 44.80618475111259 | |
| } | |
| ], | |
| "bleu": 0.2835765541228824, | |
| "chrf": 44.80618475111259, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "lb", | |
| "population": { | |
| "LU": 421015 | |
| } | |
| }, | |
| { | |
| "language_name": "Dzongkha", | |
| "bcp_47": "dz", | |
| "speakers": 370341, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.05723633975042216, | |
| "chrf": 23.461346449303786 | |
| } | |
| ], | |
| "bleu": 0.05723633975042216, | |
| "chrf": 23.461346449303786, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "BT": 367689, | |
| "IN": 2652 | |
| } | |
| }, | |
| { | |
| "language_name": "Fijian", | |
| "bcp_47": "fj", | |
| "speakers": 365030, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.10451524271139898, | |
| "chrf": 24.713018515709646 | |
| } | |
| ], | |
| "bleu": 0.10451524271139898, | |
| "chrf": 24.713018515709646, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "FJ": 365030 | |
| } | |
| }, | |
| { | |
| "language_name": "Icelandic", | |
| "bcp_47": "is", | |
| "speakers": 350734, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2142644347281729, | |
| "chrf": 40.04812999157868 | |
| } | |
| ], | |
| "bleu": 0.2142644347281729, | |
| "chrf": 40.04812999157868, | |
| "commonvoice_hours": 0.1, | |
| "commonvoice_locale": "is", | |
| "population": { | |
| "IS": 350734 | |
| } | |
| }, | |
| { | |
| "language_name": "Samoan", | |
| "bcp_47": "sm", | |
| "speakers": 252717, | |
| "scores": [ | |
| { | |
| "model": "openai/gpt-4o-mini", | |
| "bleu": 0.13327372905795537, | |
| "chrf": 28.9583532166856 | |
| }, | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.11602460228698847, | |
| "chrf": 29.156949243212015 | |
| }, | |
| { | |
| "model": "mistralai/mistral-small-24b-instruct-2501", | |
| "bleu": 0.05771585788755527, | |
| "chrf": 16.752178728973906 | |
| }, | |
| { | |
| "model": "google/gemini-2.0-flash-001", | |
| "bleu": 0.2585259997356889, | |
| "chrf": 45.18784342425295 | |
| }, | |
| { | |
| "model": "deepseek/deepseek-chat", | |
| "bleu": 0.22221137013078898, | |
| "chrf": 39.7496231353589 | |
| }, | |
| { | |
| "model": "microsoft/phi-4", | |
| "bleu": 0.04756300118196289, | |
| "chrf": 21.060764155029197 | |
| } | |
| ], | |
| "bleu": 0.13921909338015664, | |
| "chrf": 30.144285317252095, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "AS": 48943, | |
| "WS": 203774 | |
| } | |
| }, | |
| { | |
| "language_name": "Crimean Tatar", | |
| "bcp_47": "crh", | |
| "speakers": 245968, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.22725256040555009, | |
| "chrf": 42.07005703444819 | |
| } | |
| ], | |
| "bleu": 0.22725256040555009, | |
| "chrf": 42.07005703444819, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "crh", | |
| "population": { | |
| "UA": 245968 | |
| } | |
| }, | |
| { | |
| "language_name": "Papiamento", | |
| "bcp_47": "pap", | |
| "speakers": 211640, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21648792499796674, | |
| "chrf": 41.57061175824069 | |
| } | |
| ], | |
| "bleu": 0.21648792499796674, | |
| "chrf": 41.57061175824069, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "pap-AW", | |
| "population": { | |
| "AW": 72851, | |
| "BQ": 16200, | |
| "CW": 122589 | |
| } | |
| }, | |
| { | |
| "language_name": "Latgalian", | |
| "bcp_47": "ltg", | |
| "speakers": 167429, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.13475273241606922, | |
| "chrf": 32.044009672423776 | |
| } | |
| ], | |
| "bleu": 0.13475273241606922, | |
| "chrf": 32.044009672423776, | |
| "commonvoice_hours": 28.0, | |
| "commonvoice_locale": "ltg", | |
| "population": { | |
| "LV": 167429 | |
| } | |
| }, | |
| { | |
| "language_name": "Māori", | |
| "bcp_47": "mi", | |
| "speakers": 137913, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.17610729049259877, | |
| "chrf": 35.01961886760811 | |
| } | |
| ], | |
| "bleu": 0.17610729049259877, | |
| "chrf": 35.01961886760811, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "NZ": 137913 | |
| } | |
| }, | |
| { | |
| "language_name": "Scottish Gaelic", | |
| "bcp_47": "gd", | |
| "speakers": 72337, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2154279041570466, | |
| "chrf": 37.40630914857015 | |
| } | |
| ], | |
| "bleu": 0.2154279041570466, | |
| "chrf": 37.40630914857015, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "GB": 72337 | |
| } | |
| }, | |
| { | |
| "language_name": "Faroese", | |
| "bcp_47": "fo", | |
| "speakers": 71351, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.21180629663838063, | |
| "chrf": 39.28673819745006 | |
| } | |
| ], | |
| "bleu": 0.21180629663838063, | |
| "chrf": 39.28673819745006, | |
| "commonvoice_hours": 0.0, | |
| "commonvoice_locale": "fo", | |
| "population": { | |
| "DK": 22304, | |
| "FO": 49047 | |
| } | |
| }, | |
| { | |
| "language_name": "Friulian", | |
| "bcp_47": "fur", | |
| "speakers": 37442, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.2255876860328074, | |
| "chrf": 40.6191779521821 | |
| } | |
| ], | |
| "bleu": 0.2255876860328074, | |
| "chrf": 40.6191779521821, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IT": 37442 | |
| } | |
| }, | |
| { | |
| "language_name": "Sanskrit", | |
| "bcp_47": "sa", | |
| "speakers": 15913, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.14313294345831834, | |
| "chrf": 32.44676491537583 | |
| } | |
| ], | |
| "bleu": 0.14313294345831834, | |
| "chrf": 32.44676491537583, | |
| "commonvoice_hours": null, | |
| "commonvoice_locale": null, | |
| "population": { | |
| "IN": 15913 | |
| } | |
| }, | |
| { | |
| "language_name": "Esperanto", | |
| "bcp_47": "eo", | |
| "speakers": 301, | |
| "scores": [ | |
| { | |
| "model": "meta-llama/llama-3.3-70b-instruct", | |
| "bleu": 0.27440987441620224, | |
| "chrf": 44.40715599582661 | |
| } | |
| ], | |
| "bleu": 0.27440987441620224, | |
| "chrf": 44.40715599582661, | |
| "commonvoice_hours": 1436.0, | |
| "commonvoice_locale": "eo", | |
| "population": { | |
| "SM": 301 | |
| } | |
| } | |
| ] |